Upload 8 files
Browse files- .gitattributes +4 -0
- doc_201_35-2012-0345-6765-LA93-0M50-E080.json +15 -0
- doc_201_35-2012-0345-6765-LA93-0M50-E080.png +3 -0
- doc_232_44-2013-0375-6680-LA93-0M50-E080.jp2.json +15 -0
- doc_232_44-2013-0375-6680-LA93-0M50-E080.jp2.png +3 -0
- doc_748_dota_v2_dota_v2_dota_v2_P11130.json +15 -0
- doc_748_dota_v2_dota_v2_dota_v2_P11130.png +3 -0
- doc_835_dota_v2_dota_v2_dota_v2_P8230.json +15 -0
- doc_835_dota_v2_dota_v2_dota_v2_P8230.png +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
doc_201_35-2012-0345-6765-LA93-0M50-E080.png filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
doc_232_44-2013-0375-6680-LA93-0M50-E080.jp2.png filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
doc_748_dota_v2_dota_v2_dota_v2_P11130.png filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
doc_835_dota_v2_dota_v2_dota_v2_P8230.png filter=lfs diff=lfs merge=lfs -text
|
doc_201_35-2012-0345-6765-LA93-0M50-E080.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"doc_id": 201,
|
| 3 |
+
"input_media": "HRSCD/2012/35-2012-0345-6765-LA93-0M50-E080.tif",
|
| 4 |
+
"question": "In the town depicted in the lower right of the image, what is the position of the white rectangular shopping mall relative to the light blue pointed-roof building?",
|
| 5 |
+
"answer": "B",
|
| 6 |
+
"pred": "B",
|
| 7 |
+
"category": "Object spatial relationship",
|
| 8 |
+
"sub_category": "Object spatial relationship",
|
| 9 |
+
"has_bbox": false,
|
| 10 |
+
"dataset": "initiacms/XLRS-Bench-lite",
|
| 11 |
+
"source": "train/data-00004-of-00074.arrow",
|
| 12 |
+
"image_path": "D:\\PycharmProject\\postgraduate\\D_workspace\\dockerssh\\XLRS_qwen_2.5\\research\\xlrs-qwen25vl\\figures\\assets\\xlrs_cases\\doc_201_35-2012-0345-6765-LA93-0M50-E080.png",
|
| 13 |
+
"width": 10000,
|
| 14 |
+
"height": 10000
|
| 15 |
+
}
|
doc_201_35-2012-0345-6765-LA93-0M50-E080.png
ADDED
|
Git LFS Details
|
doc_232_44-2013-0375-6680-LA93-0M50-E080.jp2.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"doc_id": 232,
|
| 3 |
+
"input_media": "MiniFrance/44-2013-0375-6680-LA93-0M50-E080.jp2.tif",
|
| 4 |
+
"question": "In the image, where is the building with the cross-shaped roof located in relation to the green rectangular sports field in the upper left corner?",
|
| 5 |
+
"answer": "C",
|
| 6 |
+
"pred": "C",
|
| 7 |
+
"category": "Object spatial relationship",
|
| 8 |
+
"sub_category": "Object spatial relationship",
|
| 9 |
+
"has_bbox": false,
|
| 10 |
+
"dataset": "initiacms/XLRS-Bench-lite",
|
| 11 |
+
"source": "train/data-00005-of-00074.arrow",
|
| 12 |
+
"image_path": "D:\\PycharmProject\\postgraduate\\D_workspace\\dockerssh\\XLRS_qwen_2.5\\research\\xlrs-qwen25vl\\figures\\assets\\xlrs_cases\\doc_232_44-2013-0375-6680-LA93-0M50-E080.jp2.png",
|
| 13 |
+
"width": 10000,
|
| 14 |
+
"height": 10000
|
| 15 |
+
}
|
doc_232_44-2013-0375-6680-LA93-0M50-E080.jp2.png
ADDED
|
Git LFS Details
|
doc_748_dota_v2_dota_v2_dota_v2_P11130.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"doc_id": 748,
|
| 3 |
+
"input_media": "DOTA_v2_4096_4096/dota_v2_dota_v2_dota_v2_P11130.png",
|
| 4 |
+
"question": "How many boats are there in the entire picture?",
|
| 5 |
+
"answer": "B",
|
| 6 |
+
"pred": "D",
|
| 7 |
+
"category": "Counting",
|
| 8 |
+
"sub_category": "Overall counting",
|
| 9 |
+
"has_bbox": false,
|
| 10 |
+
"dataset": "initiacms/XLRS-Bench-lite",
|
| 11 |
+
"source": "train/data-00017-of-00074.arrow",
|
| 12 |
+
"image_path": "D:\\PycharmProject\\postgraduate\\D_workspace\\dockerssh\\XLRS_qwen_2.5\\research\\xlrs-qwen25vl\\figures\\assets\\xlrs_cases\\doc_748_dota_v2_dota_v2_dota_v2_P11130.png",
|
| 13 |
+
"width": 4096,
|
| 14 |
+
"height": 4096
|
| 15 |
+
}
|
doc_748_dota_v2_dota_v2_dota_v2_P11130.png
ADDED
|
Git LFS Details
|
doc_835_dota_v2_dota_v2_dota_v2_P8230.json
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"doc_id": 835,
|
| 3 |
+
"input_media": "DOTA_v2_4912_7360/dota_v2_dota_v2_dota_v2_P8230.png",
|
| 4 |
+
"question": "How many cars are there in the parking lot beneath the grassy area in the bottom right corner of the picture?",
|
| 5 |
+
"answer": "C",
|
| 6 |
+
"pred": "B",
|
| 7 |
+
"category": "Counting",
|
| 8 |
+
"sub_category": "Counting with complex reasoning",
|
| 9 |
+
"has_bbox": false,
|
| 10 |
+
"dataset": "initiacms/XLRS-Bench-lite",
|
| 11 |
+
"source": "train/data-00019-of-00074.arrow",
|
| 12 |
+
"image_path": "D:\\PycharmProject\\postgraduate\\D_workspace\\dockerssh\\XLRS_qwen_2.5\\research\\xlrs-qwen25vl\\figures\\assets\\xlrs_cases\\doc_835_dota_v2_dota_v2_dota_v2_P8230.png",
|
| 13 |
+
"width": 7360,
|
| 14 |
+
"height": 4912
|
| 15 |
+
}
|
doc_835_dota_v2_dota_v2_dota_v2_P8230.png
ADDED
|
Git LFS Details
|