Atlas-online-0310-2task-with-caption / scripts /qwen_vl_comparison_results.json
guoyb0's picture
Upload code snapshot (2task with caption)
95f6448 verified
{
"scenes": [
{
"scene": "scene-0234",
"sample_token": "3481dbfd65864925b4a4b2d6b7256d44",
"gt_objects": [
{
"category": "vehicle.car",
"mapped": "car",
"x": 427.464,
"y": 1618.483,
"z": 0.913,
"distance": 3.7,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 2108,
"size": [
1.988,
4.344,
1.721
]
},
{
"category": "movable_object.trafficcone",
"mapped": "traffic_cone",
"x": 427.81,
"y": 1626.405,
"z": 0.777,
"distance": 4.3,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 43,
"size": [
0.248,
0.183,
1.246
]
},
{
"category": "movable_object.trafficcone",
"mapped": "traffic_cone",
"x": 429.693,
"y": 1626.661,
"z": 0.898,
"distance": 4.8,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 52,
"size": [
0.343,
0.273,
1.258
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 432.449,
"y": 1619.73,
"z": 1.073,
"distance": 5.1,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 690,
"size": [
2.294,
4.912,
1.717
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 426.933,
"y": 1628.613,
"z": 0.865,
"distance": 6.5,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 111,
"size": [
0.567,
0.686,
1.617
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 427.123,
"y": 1629.371,
"z": 1.05,
"distance": 7.3,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 55,
"size": [
0.828,
1.04,
1.821
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 432.454,
"y": 1615.458,
"z": 0.884,
"distance": 8.1,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 319,
"size": [
1.832,
4.351,
1.501
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 439.547,
"y": 1609.757,
"z": 1.01,
"distance": 17.0,
"state": "stopped",
"visibility": "v60-80",
"lidar_pts": 13,
"size": [
2.067,
4.909,
1.565
]
},
{
"category": "vehicle.truck",
"mapped": "truck",
"x": 410.442,
"y": 1621.494,
"z": 1.573,
"distance": 17.5,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 382,
"size": [
2.972,
6.069,
3.386
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 419.673,
"y": 1639.798,
"z": 0.455,
"distance": 19.5,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 18,
"size": [
0.67,
0.502,
1.869
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 416.649,
"y": 1603.964,
"z": 0.993,
"distance": 21.4,
"state": "moving",
"visibility": "v60-80",
"lidar_pts": 4,
"size": [
0.718,
0.667,
1.821
]
},
{
"category": "vehicle.trailer",
"mapped": "trailer",
"x": 407.642,
"y": 1613.684,
"z": 1.864,
"distance": 22.0,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 735,
"size": [
3.246,
15.095,
4.02
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 413.961,
"y": 1604.956,
"z": 0.959,
"distance": 22.2,
"state": "moving",
"visibility": "v60-80",
"lidar_pts": 5,
"size": [
0.7,
0.725,
1.752
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 411.075,
"y": 1607.097,
"z": 1.045,
"distance": 22.6,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 7,
"size": [
0.715,
0.783,
1.725
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 445.462,
"y": 1607.555,
"z": 1.186,
"distance": 22.8,
"state": "stopped",
"visibility": "v60-80",
"lidar_pts": 23,
"size": [
1.912,
4.895,
1.785
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 414.04,
"y": 1604.063,
"z": 0.965,
"distance": 22.8,
"state": "moving",
"visibility": "v60-80",
"lidar_pts": 5,
"size": [
0.631,
0.675,
1.766
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 410.752,
"y": 1606.373,
"z": 0.911,
"distance": 23.4,
"state": "stopped",
"visibility": "v40-60",
"lidar_pts": 3,
"size": [
0.718,
0.762,
1.557
]
},
{
"category": "vehicle.bus.rigid",
"mapped": "bus",
"x": 448.409,
"y": 1609.846,
"z": 1.814,
"distance": 23.9,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 41,
"size": [
2.69,
9.334,
2.634
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 439.589,
"y": 1595.06,
"z": 1.078,
"distance": 29.5,
"state": "moving",
"visibility": "v40-60",
"lidar_pts": 3,
"size": [
2.155,
4.467,
1.827
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 411.286,
"y": 1646.98,
"z": 0.13,
"distance": 29.9,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 15,
"size": [
1.786,
4.539,
1.495
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 399.19,
"y": 1612.587,
"z": 0.506,
"distance": 30.3,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 1,
"size": [
0.565,
0.479,
1.746
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 407.523,
"y": 1645.886,
"z": 0.398,
"distance": 31.3,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 4,
"size": [
0.691,
0.731,
1.581
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 408.157,
"y": 1646.551,
"z": 0.214,
"distance": 31.4,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 4,
"size": [
0.669,
0.727,
1.592
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 398.446,
"y": 1610.636,
"z": 0.479,
"distance": 31.7,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 1,
"size": [
0.634,
0.482,
1.794
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 408.491,
"y": 1647.128,
"z": 0.268,
"distance": 31.7,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 4,
"size": [
0.704,
0.689,
1.721
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 395.447,
"y": 1634.657,
"z": 0.983,
"distance": 34.8,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 2,
"size": [
0.564,
0.479,
1.696
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 439.617,
"y": 1589.28,
"z": 1.122,
"distance": 34.9,
"state": "moving",
"visibility": "v60-80",
"lidar_pts": 1,
"size": [
0.613,
0.534,
1.794
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 394.111,
"y": 1630.848,
"z": 0.159,
"distance": 35.0,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 5,
"size": [
1.861,
4.589,
1.447
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 390.143,
"y": 1629.902,
"z": 0.446,
"distance": 38.6,
"state": "stopped",
"visibility": "v60-80",
"lidar_pts": 4,
"size": [
2.025,
4.409,
1.627
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 429.514,
"y": 1660.955,
"z": 0.373,
"distance": 38.8,
"state": "parked",
"visibility": "v0-40",
"lidar_pts": 9,
"size": [
2.021,
4.582,
2.0
]
},
{
"category": "vehicle.truck",
"mapped": "truck",
"x": 459.926,
"y": 1597.974,
"z": 2.161,
"distance": 40.1,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 19,
"size": [
2.939,
8.306,
3.607
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 445.619,
"y": 1586.03,
"z": 1.291,
"distance": 40.2,
"state": "moving",
"visibility": "v40-60",
"lidar_pts": 1,
"size": [
0.551,
0.575,
1.917
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 397.851,
"y": 1651.527,
"z": 0.664,
"distance": 42.1,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 3,
"size": [
0.845,
0.827,
1.862
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 387.941,
"y": 1635.636,
"z": 0.369,
"distance": 42.2,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 3,
"size": [
1.888,
4.65,
1.473
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 398.279,
"y": 1652.179,
"z": 0.697,
"distance": 42.2,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 2,
"size": [
0.835,
0.833,
1.793
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 385.925,
"y": 1633.284,
"z": 0.538,
"distance": 43.5,
"state": "stopped",
"visibility": "v40-60",
"lidar_pts": 3,
"size": [
1.862,
4.333,
1.689
]
},
{
"category": "vehicle.truck",
"mapped": "truck",
"x": 433.131,
"y": 1667.552,
"z": 0.262,
"distance": 45.7,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 11,
"size": [
2.176,
5.471,
1.859
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 406.278,
"y": 1668.853,
"z": 0.523,
"distance": 51.5,
"state": "stopped",
"visibility": "v40-60",
"lidar_pts": 2,
"size": [
0.71,
0.694,
2.022
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 456.56,
"y": 1577.648,
"z": 1.394,
"distance": 52.9,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 1,
"size": [
1.244,
1.118,
1.876
]
},
{
"category": "vehicle.truck",
"mapped": "truck",
"x": 377.328,
"y": 1638.298,
"z": 1.061,
"distance": 53.2,
"state": "stopped",
"visibility": "v40-60",
"lidar_pts": 4,
"size": [
2.846,
8.222,
3.287
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 421.7,
"y": 1675.625,
"z": 0.151,
"distance": 53.8,
"state": "moving",
"visibility": "v60-80",
"lidar_pts": 3,
"size": [
0.824,
0.953,
1.623
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 420.551,
"y": 1675.756,
"z": 0.385,
"distance": 54.1,
"state": "moving",
"visibility": "v60-80",
"lidar_pts": 3,
"size": [
0.964,
0.964,
1.752
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 374.157,
"y": 1631.782,
"z": 0.681,
"distance": 54.7,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 2,
"size": [
0.589,
0.733,
1.759
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 460.62,
"y": 1576.308,
"z": 1.476,
"distance": 56.3,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 1,
"size": [
0.891,
0.806,
1.794
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 439.354,
"y": 1679.899,
"z": 0.205,
"distance": 58.9,
"state": "parked",
"visibility": "v0-40",
"lidar_pts": 1,
"size": [
2.059,
4.396,
1.753
]
},
{
"category": "vehicle.trailer",
"mapped": "trailer",
"x": 369.485,
"y": 1643.275,
"z": 0.702,
"distance": 62.2,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 6,
"size": [
3.137,
11.647,
3.912
]
},
{
"category": "vehicle.truck",
"mapped": "truck",
"x": 365.823,
"y": 1650.429,
"z": 1.143,
"distance": 68.3,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 6,
"size": [
2.473,
5.796,
2.606
]
},
{
"category": "vehicle.truck",
"mapped": "truck",
"x": 367.729,
"y": 1656.274,
"z": 1.531,
"distance": 69.2,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 6,
"size": [
2.751,
6.985,
3.284
]
},
{
"category": "vehicle.truck",
"mapped": "truck",
"x": 387.134,
"y": 1565.191,
"z": 0.92,
"distance": 70.1,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 2,
"size": [
2.803,
8.122,
3.149
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 371.278,
"y": 1559.5,
"z": 0.449,
"distance": 84.5,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 1,
"size": [
1.98,
4.762,
2.239
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 369.149,
"y": 1560.764,
"z": 0.44,
"distance": 85.0,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 3,
"size": [
1.988,
4.952,
2.115
]
},
{
"category": "vehicle.bus.rigid",
"mapped": "bus",
"x": 343.45,
"y": 1679.443,
"z": 1.26,
"distance": 102.1,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 4,
"size": [
2.791,
6.517,
2.749
]
}
],
"ego_pos": [
427.96858346929594,
1622.1558281210846
]
},
{
"scene": "scene-0044",
"sample_token": "1dda3d57404f4057af294145ba7332f6",
"gt_objects": [
{
"category": "vehicle.bicycle",
"mapped": "bicycle",
"x": 1002.021,
"y": 1102.115,
"z": 1.285,
"distance": 13.4,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 17,
"size": [
0.53,
1.749,
1.095
]
},
{
"category": "vehicle.bicycle",
"mapped": "bicycle",
"x": 999.524,
"y": 1100.21,
"z": 1.298,
"distance": 16.3,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 5,
"size": [
0.537,
1.727,
1.051
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1018.553,
"y": 1133.448,
"z": 1.337,
"distance": 28.1,
"state": "stopped",
"visibility": "v60-80",
"lidar_pts": 2,
"size": [
0.334,
0.455,
1.528
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1017.687,
"y": 1133.831,
"z": 1.515,
"distance": 28.4,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 3,
"size": [
0.338,
0.381,
1.628
]
},
{
"category": "movable_object.pushable_pullable",
"mapped": "other",
"x": 993.512,
"y": 1085.029,
"z": 1.12,
"distance": 29.7,
"state": "unknown",
"visibility": "v0-40",
"lidar_pts": 3,
"size": [
0.79,
1.115,
1.164
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1081.921,
"y": 1085.923,
"z": 3.354,
"distance": 69.8,
"state": "moving",
"visibility": "v60-80",
"lidar_pts": 1,
"size": [
2.326,
4.674,
2.0
]
}
],
"ego_pos": [
1014.9514449951934,
1105.5630385088111
]
},
{
"scene": "scene-0566",
"sample_token": "2f78c87a92c540bcabec15760024bc20",
"gt_objects": [
{
"category": "vehicle.car",
"mapped": "car",
"x": 1329.961,
"y": 862.728,
"z": 1.093,
"distance": 8.3,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 366,
"size": [
1.84,
4.491,
1.502
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1334.047,
"y": 856.914,
"z": 1.234,
"distance": 10.0,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 106,
"size": [
1.859,
4.53,
1.599
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1327.046,
"y": 864.472,
"z": 1.037,
"distance": 10.6,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 81,
"size": [
1.79,
4.449,
1.72
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1324.321,
"y": 866.715,
"z": 1.283,
"distance": 13.1,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 94,
"size": [
1.981,
4.866,
1.898
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1338.764,
"y": 851.608,
"z": 1.018,
"distance": 14.7,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 32,
"size": [
2.122,
4.882,
1.856
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1321.807,
"y": 869.381,
"z": 1.268,
"distance": 15.9,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 12,
"size": [
1.945,
4.572,
1.725
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1354.215,
"y": 870.862,
"z": 0.618,
"distance": 17.4,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 8,
"size": [
1.889,
4.127,
1.542
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1328.273,
"y": 850.809,
"z": 1.305,
"distance": 18.0,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 3,
"size": [
1.943,
4.524,
1.942
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1335.268,
"y": 847.822,
"z": 0.843,
"distance": 18.6,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 42,
"size": [
2.104,
4.67,
1.591
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1357.726,
"y": 875.356,
"z": 0.743,
"distance": 22.2,
"state": "parked",
"visibility": "v0-40",
"lidar_pts": 1,
"size": [
1.99,
4.384,
1.815
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1316.356,
"y": 874.537,
"z": 1.305,
"distance": 22.6,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 20,
"size": [
1.827,
4.508,
1.707
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1331.19,
"y": 843.025,
"z": 1.214,
"distance": 24.1,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 1,
"size": [
1.998,
4.902,
1.859
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1314.324,
"y": 876.156,
"z": 1.304,
"distance": 25.1,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 4,
"size": [
1.844,
4.588,
1.86
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1363.401,
"y": 865.505,
"z": 0.773,
"distance": 26.0,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 17,
"size": [
1.928,
4.454,
1.766
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1312.699,
"y": 856.315,
"z": 1.293,
"distance": 26.7,
"state": "parked",
"visibility": "v0-40",
"lidar_pts": 2,
"size": [
2.141,
4.848,
1.918
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1320.184,
"y": 889.385,
"z": 1.3,
"distance": 28.8,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 13,
"size": [
2.004,
4.247,
1.573
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1321.302,
"y": 842.315,
"z": 1.733,
"distance": 28.9,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 1,
"size": [
2.183,
4.568,
1.843
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1309.414,
"y": 858.684,
"z": 1.813,
"distance": 29.0,
"state": "parked",
"visibility": "v0-40",
"lidar_pts": 6,
"size": [
2.113,
4.404,
1.643
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1366.407,
"y": 869.558,
"z": 0.658,
"distance": 29.1,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 10,
"size": [
1.773,
4.466,
1.5
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1364.427,
"y": 855.127,
"z": 0.619,
"distance": 29.2,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 11,
"size": [
2.074,
4.505,
1.629
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1310.371,
"y": 852.864,
"z": 1.129,
"distance": 30.2,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 7,
"size": [
1.866,
3.919,
1.741
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1362.37,
"y": 848.459,
"z": 1.034,
"distance": 30.6,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 10,
"size": [
1.927,
4.744,
2.0
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1351.551,
"y": 836.449,
"z": 1.467,
"distance": 33.0,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 5,
"size": [
1.942,
4.834,
1.664
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1369.88,
"y": 873.707,
"z": 0.647,
"distance": 33.3,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 18,
"size": [
1.912,
4.223,
1.814
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1371.571,
"y": 855.282,
"z": 0.523,
"distance": 35.9,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 1,
"size": [
1.858,
4.376,
1.606
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1346.005,
"y": 831.275,
"z": 1.641,
"distance": 36.0,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 14,
"size": [
2.022,
4.596,
1.837
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1373.109,
"y": 878.068,
"z": 0.948,
"distance": 37.6,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 2,
"size": [
1.866,
4.174,
1.822
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1303.378,
"y": 847.894,
"z": 1.166,
"distance": 38.7,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 3,
"size": [
1.696,
4.066,
1.889
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1339.858,
"y": 825.244,
"z": 1.015,
"distance": 41.1,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 1,
"size": [
2.133,
4.626,
1.613
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1364.933,
"y": 834.452,
"z": 1.217,
"distance": 42.1,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 2,
"size": [
2.371,
5.016,
1.814
]
},
{
"category": "vehicle.truck",
"mapped": "truck",
"x": 1307.379,
"y": 900.066,
"z": 2.377,
"distance": 45.2,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 30,
"size": [
3.121,
6.604,
3.311
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1352.949,
"y": 821.897,
"z": 1.951,
"distance": 47.0,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 12,
"size": [
2.379,
5.738,
2.222
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1369.991,
"y": 830.561,
"z": 1.478,
"distance": 48.3,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 1,
"size": [
2.322,
5.402,
2.0
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1379.637,
"y": 822.578,
"z": 1.898,
"distance": 60.8,
"state": "parked",
"visibility": "v60-80",
"lidar_pts": 6,
"size": [
2.554,
5.781,
2.224
]
},
{
"category": "vehicle.bus.rigid",
"mapped": "bus",
"x": 1279.0,
"y": 913.315,
"z": 3.074,
"distance": 75.0,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 10,
"size": [
2.786,
8.936,
3.308
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1270.859,
"y": 930.252,
"z": 2.875,
"distance": 92.3,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 1,
"size": [
2.149,
4.485,
1.842
]
}
],
"ego_pos": [
1337.4419585730511,
866.2908294672284
]
},
{
"scene": "scene-0103",
"sample_token": "3e8750f331d7499e9b5123e9eb70f2e2",
"gt_objects": [
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 598.103,
"y": 1642.075,
"z": 1.029,
"distance": 5.8,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 68,
"size": [
0.631,
0.61,
1.929
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 597.73,
"y": 1641.374,
"z": 0.993,
"distance": 6.6,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 9,
"size": [
0.712,
0.601,
1.891
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 583.549,
"y": 1656.391,
"z": 1.267,
"distance": 18.8,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 34,
"size": [
1.871,
4.488,
1.515
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 619.03,
"y": 1648.941,
"z": 0.413,
"distance": 19.0,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 9,
"size": [
0.578,
0.613,
1.752
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 612.719,
"y": 1632.142,
"z": 0.491,
"distance": 19.9,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 7,
"size": [
0.688,
0.944,
1.904
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 602.152,
"y": 1626.301,
"z": 0.234,
"distance": 21.3,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 3,
"size": [
0.489,
0.491,
1.851
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 622.249,
"y": 1646.081,
"z": 0.321,
"distance": 22.2,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 9,
"size": [
0.697,
0.498,
1.761
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 582.374,
"y": 1660.997,
"z": 1.38,
"distance": 22.3,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 40,
"size": [
2.037,
4.958,
1.639
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 582.275,
"y": 1668.561,
"z": 1.473,
"distance": 27.6,
"state": "moving",
"visibility": "v60-80",
"lidar_pts": 6,
"size": [
0.908,
1.109,
2.211
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 619.603,
"y": 1624.655,
"z": 0.071,
"distance": 30.0,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 5,
"size": [
0.665,
0.736,
1.89
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 631.807,
"y": 1644.622,
"z": -0.459,
"distance": 31.8,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 3,
"size": [
0.738,
0.783,
1.52
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 622.35,
"y": 1624.018,
"z": -0.016,
"distance": 32.3,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 5,
"size": [
0.751,
1.03,
1.975
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 631.815,
"y": 1636.973,
"z": 0.074,
"distance": 33.4,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 4,
"size": [
0.612,
0.736,
1.877
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 637.141,
"y": 1636.252,
"z": -0.235,
"distance": 38.7,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 1,
"size": [
0.621,
0.647,
1.778
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 637.791,
"y": 1636.674,
"z": -0.011,
"distance": 39.2,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 3,
"size": [
0.699,
0.738,
1.95
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 627.008,
"y": 1617.877,
"z": -0.387,
"distance": 40.0,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 2,
"size": [
0.546,
0.439,
1.622
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 640.863,
"y": 1643.013,
"z": -0.285,
"distance": 41.0,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 1,
"size": [
0.64,
0.395,
1.807
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 635.378,
"y": 1674.253,
"z": -0.163,
"distance": 44.3,
"state": "moving",
"visibility": "v40-60",
"lidar_pts": 4,
"size": [
0.909,
1.105,
2.0
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 635.447,
"y": 1620.546,
"z": -0.326,
"distance": 44.4,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 4,
"size": [
2.001,
4.734,
1.481
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 636.797,
"y": 1680.132,
"z": -0.198,
"distance": 49.1,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 3,
"size": [
0.755,
1.235,
2.083
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 650.737,
"y": 1625.23,
"z": -0.3,
"distance": 55.3,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 1,
"size": [
0.585,
0.681,
1.711
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 639.585,
"y": 1606.675,
"z": -0.122,
"distance": 56.8,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 1,
"size": [
0.724,
0.828,
1.835
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 660.851,
"y": 1604.404,
"z": -0.423,
"distance": 74.5,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 1,
"size": [
1.803,
4.495,
1.56
]
}
],
"ego_pos": [
600.1202137947669,
1647.490776275174
]
},
{
"scene": "scene-0553",
"sample_token": "8687ba92abd3406aa797115b874ebeba",
"gt_objects": [
{
"category": "vehicle.car",
"mapped": "car",
"x": 1313.096,
"y": 1036.989,
"z": 0.652,
"distance": 3.7,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 2445,
"size": [
1.861,
4.554,
1.473
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1321.516,
"y": 1033.801,
"z": 1.008,
"distance": 7.0,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 473,
"size": [
1.979,
4.782,
1.954
]
},
{
"category": "vehicle.truck",
"mapped": "truck",
"x": 1319.41,
"y": 1031.387,
"z": 1.821,
"distance": 7.8,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 1389,
"size": [
2.339,
6.418,
3.964
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1326.916,
"y": 1029.509,
"z": 0.897,
"distance": 13.9,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 0,
"size": [
1.991,
4.562,
1.494
]
},
{
"category": "vehicle.trailer",
"mapped": "trailer",
"x": 1325.647,
"y": 1026.158,
"z": 1.972,
"distance": 15.5,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 335,
"size": [
2.33,
14.01,
3.889
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1330.066,
"y": 1046.334,
"z": 0.969,
"distance": 15.7,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 50,
"size": [
3.034,
0.395,
0.94
]
},
{
"category": "vehicle.bicycle",
"mapped": "bicycle",
"x": 1308.987,
"y": 1052.606,
"z": 1.402,
"distance": 15.8,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 26,
"size": [
0.525,
1.622,
1.696
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1331.484,
"y": 1043.453,
"z": 0.76,
"distance": 15.9,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 25,
"size": [
3.025,
0.396,
1.021
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1328.982,
"y": 1049.561,
"z": 1.089,
"distance": 16.7,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 24,
"size": [
3.062,
0.416,
0.979
]
},
{
"category": "movable_object.pushable_pullable",
"mapped": "other",
"x": 1299.491,
"y": 1037.485,
"z": 0.277,
"distance": 16.9,
"state": "unknown",
"visibility": "v0-40",
"lidar_pts": 1,
"size": [
0.466,
0.689,
0.842
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1333.186,
"y": 1040.597,
"z": 0.635,
"distance": 16.9,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 35,
"size": [
2.884,
0.422,
0.972
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1298.941,
"y": 1037.322,
"z": 0.569,
"distance": 17.5,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 3,
"size": [
0.612,
0.798,
1.56
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1298.993,
"y": 1034.258,
"z": 0.529,
"distance": 17.9,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 13,
"size": [
0.692,
0.756,
1.752
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1328.425,
"y": 1052.566,
"z": 1.31,
"distance": 18.4,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 21,
"size": [
2.905,
0.44,
0.92
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1335.042,
"y": 1037.999,
"z": 0.407,
"distance": 18.7,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 31,
"size": [
3.118,
0.413,
0.916
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1297.217,
"y": 1034.028,
"z": 0.358,
"distance": 19.7,
"state": "moving",
"visibility": "v60-80",
"lidar_pts": 5,
"size": [
0.567,
0.882,
1.627
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1337.482,
"y": 1035.208,
"z": 0.186,
"distance": 21.4,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 24,
"size": [
3.586,
0.413,
0.973
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1295.022,
"y": 1034.275,
"z": 0.416,
"distance": 21.8,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 10,
"size": [
0.921,
1.027,
1.909
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1295.125,
"y": 1032.757,
"z": 0.415,
"distance": 22.0,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 7,
"size": [
0.677,
0.834,
1.658
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1293.229,
"y": 1033.246,
"z": 0.388,
"distance": 23.8,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 3,
"size": [
0.715,
0.935,
1.682
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1340.124,
"y": 1032.575,
"z": 0.154,
"distance": 24.5,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 20,
"size": [
3.28,
0.533,
0.91
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1292.802,
"y": 1030.629,
"z": 0.465,
"distance": 24.9,
"state": "moving",
"visibility": "v0-40",
"lidar_pts": 5,
"size": [
0.552,
0.918,
1.739
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1342.828,
"y": 1030.123,
"z": -0.019,
"distance": 27.8,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 7,
"size": [
3.277,
0.535,
0.909
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1345.406,
"y": 1027.941,
"z": -0.246,
"distance": 30.9,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 5,
"size": [
3.284,
0.522,
0.91
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1283.16,
"y": 1030.691,
"z": 0.359,
"distance": 34.1,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 0,
"size": [
2.029,
4.686,
1.569
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1351.279,
"y": 1022.468,
"z": 0.048,
"distance": 38.4,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 2,
"size": [
3.277,
0.533,
0.957
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1277.031,
"y": 1033.186,
"z": 0.322,
"distance": 39.7,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 7,
"size": [
2.03,
4.717,
1.387
]
},
{
"category": "vehicle.bus.rigid",
"mapped": "bus",
"x": 1274.791,
"y": 1021.332,
"z": 0.905,
"distance": 45.0,
"state": "stopped",
"visibility": "v0-40",
"lidar_pts": 4,
"size": [
2.557,
7.407,
2.811
]
},
{
"category": "vehicle.bus.rigid",
"mapped": "bus",
"x": 1269.546,
"y": 1024.852,
"z": 1.042,
"distance": 48.8,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 8,
"size": [
2.725,
9.584,
3.172
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1277.91,
"y": 1072.348,
"z": 0.912,
"distance": 51.2,
"state": "stopped",
"visibility": "v60-80",
"lidar_pts": 0,
"size": [
0.547,
0.718,
1.325
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1331.381,
"y": 1089.942,
"z": 3.241,
"distance": 53.5,
"state": "stopped",
"visibility": "v60-80",
"lidar_pts": 7,
"size": [
2.016,
4.752,
1.758
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1365.108,
"y": 1014.952,
"z": 0.254,
"distance": 54.2,
"state": "parked",
"visibility": "v80-100",
"lidar_pts": 1,
"size": [
2.02,
4.59,
1.687
]
},
{
"category": "movable_object.barrier",
"mapped": "barrier",
"x": 1273.894,
"y": 1072.524,
"z": 0.908,
"distance": 54.4,
"state": "unknown",
"visibility": "v80-100",
"lidar_pts": 0,
"size": [
2.902,
0.488,
0.944
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1334.824,
"y": 1094.85,
"z": 3.199,
"distance": 59.2,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 5,
"size": [
1.971,
4.574,
1.499
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1257.186,
"y": 1029.02,
"z": 0.276,
"distance": 60.0,
"state": "parked",
"visibility": "v0-40",
"lidar_pts": 2,
"size": [
2.01,
4.529,
1.704
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1340.58,
"y": 1102.095,
"z": 3.358,
"distance": 68.0,
"state": "stopped",
"visibility": "v80-100",
"lidar_pts": 1,
"size": [
2.17,
4.756,
1.917
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1241.295,
"y": 1063.646,
"z": 1.156,
"distance": 79.2,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 1,
"size": [
0.681,
0.708,
1.986
]
},
{
"category": "human.pedestrian.adult",
"mapped": "pedestrian",
"x": 1242.387,
"y": 1096.596,
"z": 1.312,
"distance": 94.0,
"state": "moving",
"visibility": "v40-60",
"lidar_pts": 0,
"size": [
0.673,
0.639,
1.821
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1184.486,
"y": 1119.001,
"z": 2.366,
"distance": 154.5,
"state": "moving",
"visibility": "v40-60",
"lidar_pts": 0,
"size": [
2.217,
4.734,
1.981
]
},
{
"category": "vehicle.car",
"mapped": "car",
"x": 1181.87,
"y": 1122.359,
"z": 2.116,
"distance": 158.5,
"state": "moving",
"visibility": "v80-100",
"lidar_pts": 0,
"size": [
2.176,
4.746,
1.748
]
}
],
"ego_pos": [
1316.3781762981437,
1038.5936681848448
]
}
],
"results": [
{
"model": "qwen-vl-max-latest",
"scene": "scene-0234",
"parsed": {
"vehicles": [
{
"type": "truck",
"color": "white",
"position": "front-left",
"distance_m": 10,
"state": "moving"
},
{
"type": "car",
"color": "white",
"position": "front",
"distance_m": 30,
"state": "moving"
},
{
"type": "car",
"color": "gray",
"position": "back",
"distance_m": 5,
"state": "moving"
},
{
"type": "car",
"color": "white",
"position": "back",
"distance_m": 8,
"state": "moving"
},
{
"type": "car",
"color": "black",
"position": "back-right",
"distance_m": 6,
"state": "moving"
},
{
"type": "car",
"color": "silver",
"position": "front-right",
"distance_m": 25,
"state": "parked"
},
{
"type": "car",
"color": "black",
"position": "front-right",
"distance_m": 20,
"state": "parked"
}
],
"pedestrians": [
{
"position": "front-right",
"distance_m": 12,
"state": "moving"
},
{
"position": "front-right",
"distance_m": 15,
"state": "moving"
},
{
"position": "front-left",
"distance_m": 25,
"state": "moving"
},
{
"position": "back-left",
"distance_m": 30,
"state": "moving"
}
],
"cyclists": [],
"traffic_signs": [
{
"text": "STOP",
"position": "front-right"
},
{
"text": "NO TURN ON RED",
"position": "front-right"
}
],
"traffic_cones": {
"count": 2
},
"barriers": {
"count": 4
},
"road": {
"type": "urban",
"lanes": 2,
"surface": "dry"
},
"weather": {
"condition": "sunny",
"visibility": "good"
},
"infrastructure": []
},
"input_tokens": 2483,
"output_tokens": 456,
"latency": 20.6,
"error": null
},
{
"model": "qwen-vl-max-latest",
"scene": "scene-0044",
"parsed": {
"vehicles": [],
"pedestrians": [],
"cyclists": [
{
"position": "front-right",
"distance_m": 15
}
],
"traffic_signs": [
{
"text": "SCHOOL",
"position": "front"
},
{
"text": "STOP",
"position": "back"
}
],
"traffic_cones": {
"count": 0
},
"barriers": {
"count": 0
},
"road": {
"type": "urban",
"lanes": 2,
"surface": "dry"
},
"weather": {
"condition": "sunny",
"visibility": "good"
},
"infrastructure": []
},
"input_tokens": 2483,
"output_tokens": 144,
"latency": 12.1,
"error": null
},
{
"model": "qwen-vl-max-latest",
"scene": "scene-0566",
"parsed": {
"vehicles": [
{
"type": "car",
"color": "black",
"position": "front",
"distance_m": 25,
"state": "moving"
},
{
"type": "car",
"color": "silver",
"position": "front",
"distance_m": 30,
"state": "moving"
},
{
"type": "car",
"color": "black",
"position": "front-right",
"distance_m": 15,
"state": "parked"
},
{
"type": "car",
"color": "white",
"position": "front-right",
"distance_m": 20,
"state": "parked"
},
{
"type": "car",
"color": "black",
"position": "front-left",
"distance_m": 20,
"state": "parked"
},
{
"type": "car",
"color": "silver",
"position": "front-left",
"distance_m": 25,
"state": "parked"
},
{
"type": "car",
"color": "white",
"position": "back",
"distance_m": 40,
"state": "moving"
},
{
"type": "car",
"color": "black",
"position": "back",
"distance_m": 45,
"state": "moving"
},
{
"type": "car",
"color": "silver",
"position": "back-left",
"distance_m": 35,
"state": "parked"
},
{
"type": "car",
"color": "white",
"position": "back-right",
"distance_m": 20,
"state": "parked"
},
{
"type": "van",
"color": "white",
"position": "back",
"distance_m": 50,
"state": "moving"
}
],
"pedestrians": [],
"cyclists": [],
"traffic_signs": [
{
"text": "NO PARKING ANY TIME",
"position": "front-right"
}
],
"traffic_cones": {
"count": 0
},
"barriers": {
"count": 0
},
"road": {
"type": "urban",
"lanes": 2,
"surface": "wet"
},
"weather": {
"condition": "rainy",
"visibility": "reduced"
},
"infrastructure": []
},
"input_tokens": 2483,
"output_tokens": 496,
"latency": 16.7,
"error": null
},
{
"model": "qwen-vl-max-latest",
"scene": "scene-0103",
"parsed": {
"vehicles": [
{
"type": "car",
"color": "white",
"position": "front",
"distance_m": 25,
"state": "moving"
},
{
"type": "car",
"color": "black",
"position": "front",
"distance_m": 30,
"state": "moving"
},
{
"type": "car",
"color": "white",
"position": "back",
"distance_m": 15,
"state": "moving"
},
{
"type": "car",
"color": "white",
"position": "back",
"distance_m": 20,
"state": "moving"
}
],
"pedestrians": [
{
"position": "front-left",
"distance_m": 25,
"state": "moving"
},
{
"position": "front-right",
"distance_m": 30,
"state": "moving"
},
{
"position": "back-right",
"distance_m": 10,
"state": "moving"
}
],
"cyclists": [],
"traffic_signs": [
{
"text": "STOP",
"position": "front-right"
}
],
"traffic_cones": {
"count": 0
},
"barriers": {
"count": 4
},
"road": {
"type": "urban",
"lanes": 2,
"surface": "dry"
},
"weather": {
"condition": "cloudy",
"visibility": "good"
},
"infrastructure": []
},
"input_tokens": 2483,
"output_tokens": 315,
"latency": 13.7,
"error": null
},
{
"model": "qwen-vl-max-latest",
"scene": "scene-0553",
"parsed": {
"vehicles": [
{
"type": "car",
"color": "black",
"position": "front-left",
"distance_m": 5,
"state": "stopped"
},
{
"type": "truck",
"color": "yellow",
"position": "back-right",
"distance_m": 10,
"state": "moving"
},
{
"type": "car",
"color": "silver",
"position": "back",
"distance_m": 12,
"state": "moving"
},
{
"type": "bus",
"color": "white",
"position": "front-left",
"distance_m": 30,
"state": "moving"
}
],
"pedestrians": [
{
"position": "front-left",
"distance_m": 15,
"state": "moving"
},
{
"position": "front-right",
"distance_m": 25,
"state": "moving"
}
],
"cyclists": [
{
"position": "front-right",
"distance_m": 18
}
],
"traffic_signs": [
{
"text": "STOP",
"position": "front-right"
},
{
"text": "NO TURN ON RED",
"position": "front-right"
},
{
"text": "SUMMER ST",
"position": "front-right"
}
],
"traffic_cones": {
"count": 0
},
"barriers": {
"count": 0
},
"road": {
"type": "urban",
"lanes": 2,
"surface": "dry"
},
"weather": {
"condition": "sunny",
"visibility": "good"
},
"infrastructure": []
},
"input_tokens": 2483,
"output_tokens": 346,
"latency": 16.4,
"error": null
},
{
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0234",
"parsed": {
"vehicles": [
{
"type": "car",
"color": "white",
"position": "front",
"distance_m": 45,
"state": "moving"
},
{
"type": "car",
"color": "silver",
"position": "front",
"distance_m": 30,
"state": "moving"
},
{
"type": "truck",
"color": "white",
"position": "front-left",
"distance_m": 18,
"state": "moving"
},
{
"type": "car",
"color": "gray",
"position": "back",
"distance_m": 5,
"state": "moving"
},
{
"type": "car",
"color": "white",
"position": "back",
"distance_m": 10,
"state": "moving"
},
{
"type": "suv",
"color": "black",
"position": "back-left",
"distance_m": 3,
"state": "moving"
}
],
"pedestrians": [
{
"position": "front-right",
"distance_m": 8,
"state": "moving"
},
{
"position": "front-right",
"distance_m": 12,
"state": "moving"
},
{
"position": "front",
"distance_m": 25,
"state": "moving"
},
{
"position": "front-left",
"distance_m": 20,
"state": "moving"
},
{
"position": "back-left",
"distance_m": 15,
"state": "moving"
}
],
"cyclists": [],
"traffic_signs": [
{
"text": "STOP",
"position": "front-right"
},
{
"text": "NO TURN ON RED",
"position": "front-right"
}
],
"traffic_cones": {
"count": 2
},
"barriers": {
"count": 4
},
"road": {
"type": "urban",
"lanes": 4,
"surface": "dry"
},
"weather": {
"condition": "sunny",
"visibility": "good"
},
"infrastructure": [
"bridge",
"railings",
"buildings"
]
},
"input_tokens": 2483,
"output_tokens": 451,
"latency": 24.5,
"error": null
},
{
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0044",
"parsed": {
"vehicles": [],
"pedestrians": [],
"cyclists": [
{
"position": "front-right",
"distance_m": 15
}
],
"traffic_signs": [
{
"text": "SCHOOL",
"position": "front"
},
{
"text": "STOP",
"position": "back"
}
],
"traffic_cones": {
"count": 0
},
"barriers": {
"count": 0
},
"road": {
"type": "urban",
"lanes": 2,
"surface": "dry"
},
"weather": {
"condition": "sunny",
"visibility": "good"
},
"infrastructure": []
},
"input_tokens": 2483,
"output_tokens": 178,
"latency": 13.7,
"error": null
},
{
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0566",
"parsed": {
"vehicles": [
{
"type": "car",
"color": "black",
"position": "front",
"distance_m": 25,
"state": "moving"
},
{
"type": "car",
"color": "silver",
"position": "front",
"distance_m": 30,
"state": "parked"
},
{
"type": "suv",
"color": "black",
"position": "front-right",
"distance_m": 15,
"state": "parked"
},
{
"type": "car",
"color": "white",
"position": "front-right",
"distance_m": 20,
"state": "parked"
},
{
"type": "car",
"color": "black",
"position": "front-left",
"distance_m": 18,
"state": "parked"
},
{
"type": "car",
"color": "silver",
"position": "back",
"distance_m": 10,
"state": "parked"
},
{
"type": "van",
"color": "white",
"position": "back",
"distance_m": 40,
"state": "moving"
},
{
"type": "car",
"color": "white",
"position": "back-right",
"distance_m": 8,
"state": "parked"
}
],
"pedestrians": [],
"cyclists": [],
"traffic_signs": [
{
"text": "NO PARKING ANY TIME",
"position": "front-right"
}
],
"traffic_cones": {
"count": 0
},
"barriers": {
"count": 0
},
"road": {
"type": "urban",
"lanes": 2,
"surface": "wet"
},
"weather": {
"condition": "rainy",
"visibility": "moderate"
},
"infrastructure": []
},
"input_tokens": 2483,
"output_tokens": 395,
"latency": 21.1,
"error": null
},
{
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0103",
"parsed": {
"vehicles": [
{
"type": "car",
"color": "white",
"position": "front",
"distance_m": 35,
"state": "moving"
},
{
"type": "car",
"color": "black",
"position": "front",
"distance_m": 40,
"state": "moving"
},
{
"type": "car",
"color": "silver",
"position": "back",
"distance_m": 25,
"state": "moving"
},
{
"type": "car",
"color": "white",
"position": "back",
"distance_m": 30,
"state": "moving"
}
],
"pedestrians": [
{
"position": "front-right",
"distance_m": 15,
"state": "moving"
},
{
"position": "front-left",
"distance_m": 20,
"state": "moving"
},
{
"position": "back-right",
"distance_m": 8,
"state": "moving"
},
{
"position": "front",
"distance_m": 25,
"state": "moving"
},
{
"position": "front",
"distance_m": 30,
"state": "moving"
}
],
"cyclists": [],
"traffic_signs": [
{
"text": "STOP",
"position": "front-right"
}
],
"traffic_cones": {
"count": 0
},
"barriers": {
"count": 0
},
"road": {
"type": "urban",
"lanes": 2,
"surface": "dry"
},
"weather": {
"condition": "cloudy",
"visibility": "good"
},
"infrastructure": []
},
"input_tokens": 2483,
"output_tokens": 356,
"latency": 22.4,
"error": null
},
{
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0553",
"parsed": {
"vehicles": [
{
"type": "car",
"color": "black",
"position": "front-left",
"distance_m": 5,
"state": "parked"
},
{
"type": "truck",
"color": "yellow",
"position": "back",
"distance_m": 10,
"state": "moving"
},
{
"type": "suv",
"color": "silver",
"position": "back",
"distance_m": 8,
"state": "moving"
}
],
"pedestrians": [
{
"position": "front-left",
"distance_m": 15,
"state": "moving"
}
],
"cyclists": [
{
"position": "front",
"distance_m": 8
}
],
"traffic_signs": [
{
"text": "STOP",
"position": "front"
},
{
"text": "NO TURN ON RED",
"position": "front-right"
}
],
"traffic_cones": {
"count": 0
},
"barriers": {
"count": 0
},
"road": {
"type": "urban",
"lanes": 2,
"surface": "dry"
},
"weather": {
"condition": "sunny",
"visibility": "good"
},
"infrastructure": []
},
"input_tokens": 2483,
"output_tokens": 271,
"latency": 12.3,
"error": null
}
],
"evaluations": [
{
"category_recall": 0.667,
"recalled_categories": [
"car",
"pedestrian",
"traffic_cone",
"truck"
],
"missed_categories": [
"bus",
"trailer"
],
"false_categories": [
"barrier"
],
"count_errors": {
"pedestrian": {
"gt": 24,
"pred": 4,
"error": 20
},
"truck": {
"gt": 7,
"pred": 1,
"error": 6
},
"trailer": {
"gt": 2,
"pred": 0,
"error": 2
},
"car": {
"gt": 15,
"pred": 6,
"error": 9
},
"traffic_cone": {
"gt": 2,
"pred": 2,
"error": 0
},
"bus": {
"gt": 2,
"pred": 0,
"error": 2
}
},
"avg_count_mae": 6.5,
"near_recall": 0.6,
"mid_recall": 0.185,
"far_recall": 0.0,
"state_accuracy": 0.18,
"weather_pred": "sunny",
"road_surface_pred": "dry",
"pred_counts": {
"truck": 1,
"car": 6,
"pedestrian": 4,
"bicycle": 0,
"traffic_cone": 2,
"barrier": 4
},
"gt_counts": {
"car": 15,
"traffic_cone": 2,
"pedestrian": 24,
"truck": 7,
"trailer": 2,
"bus": 2
},
"model": "qwen-vl-max-latest",
"scene": "scene-0234",
"input_tokens": 2483,
"output_tokens": 456,
"latency": 20.6
},
{
"category_recall": 0.333,
"recalled_categories": [
"bicycle"
],
"missed_categories": [
"car",
"pedestrian"
],
"false_categories": [],
"count_errors": {
"bicycle": {
"gt": 2,
"pred": 1,
"error": 1
},
"car": {
"gt": 1,
"pred": 0,
"error": 1
},
"pedestrian": {
"gt": 2,
"pred": 0,
"error": 2
}
},
"avg_count_mae": 1.3,
"near_recall": 0.0,
"mid_recall": 0.0,
"far_recall": 0.0,
"state_accuracy": 0.0,
"weather_pred": "sunny",
"road_surface_pred": "dry",
"pred_counts": {
"pedestrian": 0,
"bicycle": 1,
"traffic_cone": 0,
"barrier": 0
},
"gt_counts": {
"bicycle": 2,
"pedestrian": 2,
"car": 1
},
"model": "qwen-vl-max-latest",
"scene": "scene-0044",
"input_tokens": 2483,
"output_tokens": 144,
"latency": 12.1
},
{
"category_recall": 0.333,
"recalled_categories": [
"car"
],
"missed_categories": [
"bus",
"truck"
],
"false_categories": [],
"count_errors": {
"car": {
"gt": 34,
"pred": 11,
"error": 23
},
"truck": {
"gt": 1,
"pred": 0,
"error": 1
},
"bus": {
"gt": 1,
"pred": 0,
"error": 1
}
},
"avg_count_mae": 8.3,
"near_recall": 0.111,
"mid_recall": 0.375,
"far_recall": 0.333,
"state_accuracy": 0.222,
"weather_pred": "rainy",
"road_surface_pred": "wet",
"pred_counts": {
"car": 11,
"pedestrian": 0,
"bicycle": 0,
"traffic_cone": 0,
"barrier": 0
},
"gt_counts": {
"car": 34,
"truck": 1,
"bus": 1
},
"model": "qwen-vl-max-latest",
"scene": "scene-0566",
"input_tokens": 2483,
"output_tokens": 496,
"latency": 16.7
},
{
"category_recall": 1.0,
"recalled_categories": [
"car",
"pedestrian"
],
"missed_categories": [],
"false_categories": [
"barrier"
],
"count_errors": {
"car": {
"gt": 4,
"pred": 4,
"error": 0
},
"pedestrian": {
"gt": 19,
"pred": 3,
"error": 16
}
},
"avg_count_mae": 8.0,
"near_recall": 0.4,
"mid_recall": 0.333,
"far_recall": 0.0,
"state_accuracy": 0.304,
"weather_pred": "cloudy",
"road_surface_pred": "dry",
"pred_counts": {
"car": 4,
"pedestrian": 3,
"bicycle": 0,
"traffic_cone": 0,
"barrier": 4
},
"gt_counts": {
"pedestrian": 19,
"car": 4
},
"model": "qwen-vl-max-latest",
"scene": "scene-0103",
"input_tokens": 2483,
"output_tokens": 315,
"latency": 13.7
},
{
"category_recall": 0.714,
"recalled_categories": [
"bicycle",
"bus",
"car",
"pedestrian",
"truck"
],
"missed_categories": [
"barrier",
"trailer"
],
"false_categories": [],
"count_errors": {
"pedestrian": {
"gt": 10,
"pred": 2,
"error": 8
},
"truck": {
"gt": 1,
"pred": 1,
"error": 0
},
"trailer": {
"gt": 1,
"pred": 0,
"error": 1
},
"car": {
"gt": 12,
"pred": 2,
"error": 10
},
"bicycle": {
"gt": 1,
"pred": 1,
"error": 0
},
"barrier": {
"gt": 12,
"pred": 0,
"error": 12
},
"bus": {
"gt": 2,
"pred": 1,
"error": 1
}
},
"avg_count_mae": 4.6,
"near_recall": 0.267,
"mid_recall": 0.154,
"far_recall": 0.0,
"state_accuracy": 0.185,
"weather_pred": "sunny",
"road_surface_pred": "dry",
"pred_counts": {
"car": 2,
"truck": 1,
"bus": 1,
"pedestrian": 2,
"bicycle": 1,
"traffic_cone": 0,
"barrier": 0
},
"gt_counts": {
"car": 12,
"truck": 1,
"trailer": 1,
"barrier": 12,
"bicycle": 1,
"pedestrian": 10,
"bus": 2
},
"model": "qwen-vl-max-latest",
"scene": "scene-0553",
"input_tokens": 2483,
"output_tokens": 346,
"latency": 16.4
},
{
"category_recall": 0.667,
"recalled_categories": [
"car",
"pedestrian",
"traffic_cone",
"truck"
],
"missed_categories": [
"bus",
"trailer"
],
"false_categories": [
"barrier"
],
"count_errors": {
"pedestrian": {
"gt": 24,
"pred": 5,
"error": 19
},
"truck": {
"gt": 7,
"pred": 1,
"error": 6
},
"trailer": {
"gt": 2,
"pred": 0,
"error": 2
},
"car": {
"gt": 15,
"pred": 5,
"error": 10
},
"traffic_cone": {
"gt": 2,
"pred": 2,
"error": 0
},
"bus": {
"gt": 2,
"pred": 0,
"error": 2
}
},
"avg_count_mae": 6.5,
"near_recall": 0.7,
"mid_recall": 0.148,
"far_recall": 0.0,
"state_accuracy": 0.16,
"weather_pred": "sunny",
"road_surface_pred": "dry",
"pred_counts": {
"car": 5,
"truck": 1,
"pedestrian": 5,
"bicycle": 0,
"traffic_cone": 2,
"barrier": 4
},
"gt_counts": {
"car": 15,
"traffic_cone": 2,
"pedestrian": 24,
"truck": 7,
"trailer": 2,
"bus": 2
},
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0234",
"input_tokens": 2483,
"output_tokens": 451,
"latency": 24.5
},
{
"category_recall": 0.333,
"recalled_categories": [
"bicycle"
],
"missed_categories": [
"car",
"pedestrian"
],
"false_categories": [],
"count_errors": {
"bicycle": {
"gt": 2,
"pred": 1,
"error": 1
},
"car": {
"gt": 1,
"pred": 0,
"error": 1
},
"pedestrian": {
"gt": 2,
"pred": 0,
"error": 2
}
},
"avg_count_mae": 1.3,
"near_recall": 0.0,
"mid_recall": 0.0,
"far_recall": 0.0,
"state_accuracy": 0.0,
"weather_pred": "sunny",
"road_surface_pred": "dry",
"pred_counts": {
"pedestrian": 0,
"bicycle": 1,
"traffic_cone": 0,
"barrier": 0
},
"gt_counts": {
"bicycle": 2,
"pedestrian": 2,
"car": 1
},
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0044",
"input_tokens": 2483,
"output_tokens": 178,
"latency": 13.7
},
{
"category_recall": 0.333,
"recalled_categories": [
"car"
],
"missed_categories": [
"bus",
"truck"
],
"false_categories": [],
"count_errors": {
"car": {
"gt": 34,
"pred": 8,
"error": 26
},
"truck": {
"gt": 1,
"pred": 0,
"error": 1
},
"bus": {
"gt": 1,
"pred": 0,
"error": 1
}
},
"avg_count_mae": 9.3,
"near_recall": 0.444,
"mid_recall": 0.167,
"far_recall": 0.0,
"state_accuracy": 0.222,
"weather_pred": "rainy",
"road_surface_pred": "wet",
"pred_counts": {
"car": 8,
"pedestrian": 0,
"bicycle": 0,
"traffic_cone": 0,
"barrier": 0
},
"gt_counts": {
"car": 34,
"truck": 1,
"bus": 1
},
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0566",
"input_tokens": 2483,
"output_tokens": 395,
"latency": 21.1
},
{
"category_recall": 1.0,
"recalled_categories": [
"car",
"pedestrian"
],
"missed_categories": [],
"false_categories": [],
"count_errors": {
"car": {
"gt": 4,
"pred": 4,
"error": 0
},
"pedestrian": {
"gt": 19,
"pred": 5,
"error": 14
}
},
"avg_count_mae": 7.0,
"near_recall": 0.4,
"mid_recall": 0.467,
"far_recall": 0.0,
"state_accuracy": 0.391,
"weather_pred": "cloudy",
"road_surface_pred": "dry",
"pred_counts": {
"car": 4,
"pedestrian": 5,
"bicycle": 0,
"traffic_cone": 0,
"barrier": 0
},
"gt_counts": {
"pedestrian": 19,
"car": 4
},
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0103",
"input_tokens": 2483,
"output_tokens": 356,
"latency": 22.4
},
{
"category_recall": 0.571,
"recalled_categories": [
"bicycle",
"car",
"pedestrian",
"truck"
],
"missed_categories": [
"barrier",
"bus",
"trailer"
],
"false_categories": [],
"count_errors": {
"pedestrian": {
"gt": 10,
"pred": 1,
"error": 9
},
"truck": {
"gt": 1,
"pred": 1,
"error": 0
},
"trailer": {
"gt": 1,
"pred": 0,
"error": 1
},
"car": {
"gt": 12,
"pred": 2,
"error": 10
},
"bicycle": {
"gt": 1,
"pred": 1,
"error": 0
},
"barrier": {
"gt": 12,
"pred": 0,
"error": 12
},
"bus": {
"gt": 2,
"pred": 0,
"error": 2
}
},
"avg_count_mae": 4.9,
"near_recall": 0.267,
"mid_recall": 0.0,
"far_recall": 0.0,
"state_accuracy": 0.111,
"weather_pred": "sunny",
"road_surface_pred": "dry",
"pred_counts": {
"car": 2,
"truck": 1,
"pedestrian": 1,
"bicycle": 1,
"traffic_cone": 0,
"barrier": 0
},
"gt_counts": {
"car": 12,
"truck": 1,
"trailer": 1,
"barrier": 12,
"bicycle": 1,
"pedestrian": 10,
"bus": 2
},
"model": "qwen3-vl-235b-a22b-instruct",
"scene": "scene-0553",
"input_tokens": 2483,
"output_tokens": 271,
"latency": 12.3
}
]
}