diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,13229 @@ +{ + "best_global_step": 8700, + "best_metric": 0.6588571428571428, + "best_model_checkpoint": "/workspace/wcp/train_copy/models/pano_qwen3_5_new_val_cross_fixed_train_final_1M_065indoor/checkpoint-8700", + "epoch": 0.24934082311131492, + "eval_steps": 300, + "global_step": 8700, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.00014329932362719248, + "grad_norm": 130.10176283800956, + "learning_rate": 3.82043935052531e-09, + "loss": 3.3757232666015624, + "step": 5 + }, + { + "epoch": 0.00028659864725438496, + "grad_norm": 130.70226030791696, + "learning_rate": 8.595988538681948e-09, + "loss": 3.230146026611328, + "step": 10 + }, + { + "epoch": 0.00042989797088157744, + "grad_norm": 130.5898462093005, + "learning_rate": 1.3371537726838587e-08, + "loss": 3.315180206298828, + "step": 15 + }, + { + "epoch": 0.0005731972945087699, + "grad_norm": 192.4699018465675, + "learning_rate": 1.8147086914995226e-08, + "loss": 3.4893402099609374, + "step": 20 + }, + { + "epoch": 0.0007164966181359624, + "grad_norm": 289.49748171548947, + "learning_rate": 2.292263610315186e-08, + "loss": 3.3964767456054688, + "step": 25 + }, + { + "epoch": 0.0008597959417631549, + "grad_norm": 158.20134529620628, + "learning_rate": 2.76981852913085e-08, + "loss": 3.41004638671875, + "step": 30 + }, + { + "epoch": 0.0010030952653903474, + "grad_norm": 113.48876008679255, + "learning_rate": 3.2473734479465135e-08, + "loss": 3.557101821899414, + "step": 35 + }, + { + "epoch": 0.0011463945890175398, + "grad_norm": 219.49622511171222, + "learning_rate": 3.724928366762178e-08, + "loss": 3.2947158813476562, + "step": 40 + }, + { + "epoch": 0.0012896939126447323, + "grad_norm": 402.71161927696795, + "learning_rate": 4.202483285577841e-08, + "loss": 3.4728763580322264, + "step": 45 + }, + { + "epoch": 0.0014329932362719248, + "grad_norm": 129.97309961901587, + "learning_rate": 4.680038204393505e-08, + "loss": 3.288340759277344, + "step": 50 + }, + { + "epoch": 0.0015762925598991173, + "grad_norm": 162.249090310583, + "learning_rate": 5.157593123209169e-08, + "loss": 3.2877471923828123, + "step": 55 + }, + { + "epoch": 0.0017195918835263098, + "grad_norm": 260.06846049796695, + "learning_rate": 5.635148042024833e-08, + "loss": 3.35028076171875, + "step": 60 + }, + { + "epoch": 0.0018628912071535022, + "grad_norm": 111.93475089143874, + "learning_rate": 6.112702960840496e-08, + "loss": 3.4910888671875, + "step": 65 + }, + { + "epoch": 0.0020061905307806947, + "grad_norm": 96.16550654427104, + "learning_rate": 6.59025787965616e-08, + "loss": 3.188486099243164, + "step": 70 + }, + { + "epoch": 0.0021494898544078874, + "grad_norm": 107.6661061797472, + "learning_rate": 7.067812798471824e-08, + "loss": 3.2005516052246095, + "step": 75 + }, + { + "epoch": 0.0022927891780350797, + "grad_norm": 123.95409609723227, + "learning_rate": 7.545367717287487e-08, + "loss": 3.0405881881713865, + "step": 80 + }, + { + "epoch": 0.0024360885016622724, + "grad_norm": 143.61758576872876, + "learning_rate": 8.022922636103152e-08, + "loss": 3.1121103286743166, + "step": 85 + }, + { + "epoch": 0.0025793878252894646, + "grad_norm": 117.99580076534836, + "learning_rate": 8.500477554918815e-08, + "loss": 2.9949695587158205, + "step": 90 + }, + { + "epoch": 0.0027226871489166573, + "grad_norm": 126.26479163504341, + "learning_rate": 8.978032473734479e-08, + "loss": 2.751686668395996, + "step": 95 + }, + { + "epoch": 0.0028659864725438496, + "grad_norm": 188.81339750595197, + "learning_rate": 9.455587392550144e-08, + "loss": 2.847269821166992, + "step": 100 + }, + { + "epoch": 0.0030092857961710423, + "grad_norm": 99.84633416001628, + "learning_rate": 9.933142311365806e-08, + "loss": 2.4627933502197266, + "step": 105 + }, + { + "epoch": 0.0031525851197982345, + "grad_norm": 114.00136620109149, + "learning_rate": 1.041069723018147e-07, + "loss": 2.59106559753418, + "step": 110 + }, + { + "epoch": 0.0032958844434254272, + "grad_norm": 111.41274131951891, + "learning_rate": 1.0888252148997135e-07, + "loss": 2.3305707931518556, + "step": 115 + }, + { + "epoch": 0.0034391837670526195, + "grad_norm": 201.10624042576345, + "learning_rate": 1.1365807067812797e-07, + "loss": 2.3272731781005858, + "step": 120 + }, + { + "epoch": 0.003582483090679812, + "grad_norm": 170.10713164117593, + "learning_rate": 1.1843361986628461e-07, + "loss": 2.212013053894043, + "step": 125 + }, + { + "epoch": 0.0037257824143070045, + "grad_norm": 91.2993128934437, + "learning_rate": 1.2320916905444125e-07, + "loss": 2.1927494049072265, + "step": 130 + }, + { + "epoch": 0.003869081737934197, + "grad_norm": 188.45361592406041, + "learning_rate": 1.279847182425979e-07, + "loss": 2.0792972564697267, + "step": 135 + }, + { + "epoch": 0.004012381061561389, + "grad_norm": 111.82053916005604, + "learning_rate": 1.3276026743075452e-07, + "loss": 2.190343475341797, + "step": 140 + }, + { + "epoch": 0.004155680385188582, + "grad_norm": 68.26247430922433, + "learning_rate": 1.3753581661891116e-07, + "loss": 1.9425752639770508, + "step": 145 + }, + { + "epoch": 0.004298979708815775, + "grad_norm": 88.1109381690401, + "learning_rate": 1.4231136580706783e-07, + "loss": 2.0469944000244142, + "step": 150 + }, + { + "epoch": 0.004442279032442967, + "grad_norm": 87.51626220247937, + "learning_rate": 1.4708691499522444e-07, + "loss": 2.019863319396973, + "step": 155 + }, + { + "epoch": 0.004585578356070159, + "grad_norm": 119.43247544454381, + "learning_rate": 1.5186246418338107e-07, + "loss": 2.0515605926513674, + "step": 160 + }, + { + "epoch": 0.004728877679697352, + "grad_norm": 79.46941263569782, + "learning_rate": 1.5663801337153774e-07, + "loss": 1.8794429779052735, + "step": 165 + }, + { + "epoch": 0.004872177003324545, + "grad_norm": 101.77199803410372, + "learning_rate": 1.6141356255969435e-07, + "loss": 1.9235395431518554, + "step": 170 + }, + { + "epoch": 0.005015476326951737, + "grad_norm": 88.15730892514743, + "learning_rate": 1.6618911174785099e-07, + "loss": 1.8856552124023438, + "step": 175 + }, + { + "epoch": 0.005158775650578929, + "grad_norm": 108.86609995191733, + "learning_rate": 1.7096466093600765e-07, + "loss": 1.7375839233398438, + "step": 180 + }, + { + "epoch": 0.0053020749742061215, + "grad_norm": 86.1624860138321, + "learning_rate": 1.7574021012416426e-07, + "loss": 1.872894859313965, + "step": 185 + }, + { + "epoch": 0.005445374297833315, + "grad_norm": 69.22011547242509, + "learning_rate": 1.805157593123209e-07, + "loss": 1.6851161956787108, + "step": 190 + }, + { + "epoch": 0.005588673621460507, + "grad_norm": 106.64775286278707, + "learning_rate": 1.8529130850047756e-07, + "loss": 1.7300590515136718, + "step": 195 + }, + { + "epoch": 0.005731972945087699, + "grad_norm": 102.45514918720728, + "learning_rate": 1.9006685768863417e-07, + "loss": 1.6235618591308594, + "step": 200 + }, + { + "epoch": 0.0058752722687148914, + "grad_norm": 72.44050463629189, + "learning_rate": 1.948424068767908e-07, + "loss": 1.5797079086303711, + "step": 205 + }, + { + "epoch": 0.006018571592342085, + "grad_norm": 81.7998599957329, + "learning_rate": 1.9961795606494748e-07, + "loss": 1.6043720245361328, + "step": 210 + }, + { + "epoch": 0.006161870915969277, + "grad_norm": 81.67682881050125, + "learning_rate": 2.043935052531041e-07, + "loss": 1.5952083587646484, + "step": 215 + }, + { + "epoch": 0.006305170239596469, + "grad_norm": 95.96431161893256, + "learning_rate": 2.0916905444126072e-07, + "loss": 1.5379167556762696, + "step": 220 + }, + { + "epoch": 0.006448469563223661, + "grad_norm": 54.51686897873967, + "learning_rate": 2.139446036294174e-07, + "loss": 1.4518994331359862, + "step": 225 + }, + { + "epoch": 0.0065917688868508545, + "grad_norm": 117.47381154963601, + "learning_rate": 2.18720152817574e-07, + "loss": 1.511873435974121, + "step": 230 + }, + { + "epoch": 0.006735068210478047, + "grad_norm": 85.73840378393272, + "learning_rate": 2.2349570200573064e-07, + "loss": 1.440812110900879, + "step": 235 + }, + { + "epoch": 0.006878367534105239, + "grad_norm": 96.16460720241353, + "learning_rate": 2.282712511938873e-07, + "loss": 1.4890948295593263, + "step": 240 + }, + { + "epoch": 0.007021666857732431, + "grad_norm": 74.67374794970482, + "learning_rate": 2.330468003820439e-07, + "loss": 1.4159594535827638, + "step": 245 + }, + { + "epoch": 0.007164966181359624, + "grad_norm": 80.32553209291476, + "learning_rate": 2.3782234957020055e-07, + "loss": 1.3850113868713378, + "step": 250 + }, + { + "epoch": 0.007308265504986817, + "grad_norm": 60.91083935469522, + "learning_rate": 2.425978987583572e-07, + "loss": 1.336259651184082, + "step": 255 + }, + { + "epoch": 0.007451564828614009, + "grad_norm": 126.36425429661543, + "learning_rate": 2.473734479465138e-07, + "loss": 1.3669473648071289, + "step": 260 + }, + { + "epoch": 0.007594864152241201, + "grad_norm": 86.4189341237781, + "learning_rate": 2.5214899713467046e-07, + "loss": 1.3519164085388184, + "step": 265 + }, + { + "epoch": 0.007738163475868394, + "grad_norm": 92.48753379084371, + "learning_rate": 2.569245463228271e-07, + "loss": 1.2948493003845214, + "step": 270 + }, + { + "epoch": 0.007881462799495587, + "grad_norm": 73.93540696160484, + "learning_rate": 2.617000955109838e-07, + "loss": 1.242650604248047, + "step": 275 + }, + { + "epoch": 0.008024762123122779, + "grad_norm": 98.852775838745, + "learning_rate": 2.6647564469914043e-07, + "loss": 1.2157496452331542, + "step": 280 + }, + { + "epoch": 0.008168061446749971, + "grad_norm": 96.28361390934792, + "learning_rate": 2.71251193887297e-07, + "loss": 1.2824191093444823, + "step": 285 + }, + { + "epoch": 0.008311360770377163, + "grad_norm": 63.20779426893593, + "learning_rate": 2.7602674307545365e-07, + "loss": 1.1292677879333497, + "step": 290 + }, + { + "epoch": 0.008454660094004356, + "grad_norm": 57.670170338188996, + "learning_rate": 2.808022922636103e-07, + "loss": 1.1830550193786622, + "step": 295 + }, + { + "epoch": 0.00859795941763155, + "grad_norm": 83.73732146138217, + "learning_rate": 2.855778414517669e-07, + "loss": 1.1932281494140624, + "step": 300 + }, + { + "epoch": 0.00859795941763155, + "eval_bfov_iou": 0.02609686632335233, + "eval_bfov_iou@0.1": 0.104, + "eval_bfov_iou@0.25": 0.012, + "eval_bfov_iou@0.5": 0.0, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.3028571428571429, + "eval_exact_match": 0.2545, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 351.812, + "eval_samples_per_second": 5.685, + "eval_steps_per_second": 0.179, + "eval_task_acc_absolute_direction_mc": 0.248, + "eval_task_acc_camera_rotation_transform_mc": 0.192, + "eval_task_acc_object_conditioned_reorientation_mc": 0.236, + "eval_task_acc_observer_distance_choice": 0.472, + "eval_task_acc_relative_3d_position_mc": 0.268, + "eval_task_acc_relative_direction_mc": 0.316, + "eval_task_acc_seam_continuity_mc": 0.388, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.104, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.012, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.0, + "eval_task_bfov_iou_referring_grounding_bfov": 0.02609686632335233, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 300 + }, + { + "epoch": 0.008741258741258742, + "grad_norm": 122.17836330190953, + "learning_rate": 2.903533906399236e-07, + "loss": 1.0471515655517578, + "step": 305 + }, + { + "epoch": 0.008884558064885934, + "grad_norm": 75.3204294492472, + "learning_rate": 2.9512893982808025e-07, + "loss": 1.0754579544067382, + "step": 310 + }, + { + "epoch": 0.009027857388513126, + "grad_norm": 67.59168909409598, + "learning_rate": 2.9990448901623684e-07, + "loss": 1.0619507789611817, + "step": 315 + }, + { + "epoch": 0.009171156712140319, + "grad_norm": 90.13794806387445, + "learning_rate": 3.046800382043935e-07, + "loss": 1.0815265655517579, + "step": 320 + }, + { + "epoch": 0.009314456035767511, + "grad_norm": 116.19322266503163, + "learning_rate": 3.094555873925501e-07, + "loss": 1.0257113456726075, + "step": 325 + }, + { + "epoch": 0.009457755359394703, + "grad_norm": 168.2648496752938, + "learning_rate": 3.1423113658070675e-07, + "loss": 0.9958287239074707, + "step": 330 + }, + { + "epoch": 0.009601054683021895, + "grad_norm": 72.57307784747061, + "learning_rate": 3.1900668576886344e-07, + "loss": 1.0373401641845703, + "step": 335 + }, + { + "epoch": 0.00974435400664909, + "grad_norm": 89.83049894808619, + "learning_rate": 3.237822349570201e-07, + "loss": 0.9914106369018555, + "step": 340 + }, + { + "epoch": 0.009887653330276282, + "grad_norm": 84.87334233341636, + "learning_rate": 3.2855778414517666e-07, + "loss": 1.009526252746582, + "step": 345 + }, + { + "epoch": 0.010030952653903474, + "grad_norm": 122.43797663658873, + "learning_rate": 3.333333333333333e-07, + "loss": 0.9597312927246093, + "step": 350 + }, + { + "epoch": 0.010174251977530666, + "grad_norm": 68.89253357058959, + "learning_rate": 3.3810888252148994e-07, + "loss": 0.9659263610839843, + "step": 355 + }, + { + "epoch": 0.010317551301157859, + "grad_norm": 82.63498627137628, + "learning_rate": 3.428844317096466e-07, + "loss": 1.0139739036560058, + "step": 360 + }, + { + "epoch": 0.01046085062478505, + "grad_norm": 92.33208148988926, + "learning_rate": 3.4765998089780327e-07, + "loss": 0.945893669128418, + "step": 365 + }, + { + "epoch": 0.010604149948412243, + "grad_norm": 97.30020227252153, + "learning_rate": 3.524355300859599e-07, + "loss": 0.9304169654846192, + "step": 370 + }, + { + "epoch": 0.010747449272039435, + "grad_norm": 96.1087469103912, + "learning_rate": 3.5721107927411654e-07, + "loss": 0.9498260498046875, + "step": 375 + }, + { + "epoch": 0.01089074859566663, + "grad_norm": 50.64594283905199, + "learning_rate": 3.619866284622731e-07, + "loss": 0.9736908912658692, + "step": 380 + }, + { + "epoch": 0.011034047919293822, + "grad_norm": 80.108084437732, + "learning_rate": 3.6676217765042976e-07, + "loss": 0.9271239280700684, + "step": 385 + }, + { + "epoch": 0.011177347242921014, + "grad_norm": 100.62426433824146, + "learning_rate": 3.715377268385864e-07, + "loss": 0.9057989120483398, + "step": 390 + }, + { + "epoch": 0.011320646566548206, + "grad_norm": 95.9609378940049, + "learning_rate": 3.763132760267431e-07, + "loss": 0.9005050659179688, + "step": 395 + }, + { + "epoch": 0.011463945890175398, + "grad_norm": 60.45814354732819, + "learning_rate": 3.8108882521489973e-07, + "loss": 0.9010601043701172, + "step": 400 + }, + { + "epoch": 0.01160724521380259, + "grad_norm": 62.095490076953666, + "learning_rate": 3.8586437440305637e-07, + "loss": 0.8139686584472656, + "step": 405 + }, + { + "epoch": 0.011750544537429783, + "grad_norm": 78.38434787265233, + "learning_rate": 3.9063992359121295e-07, + "loss": 0.9032320022583008, + "step": 410 + }, + { + "epoch": 0.011893843861056975, + "grad_norm": 65.65753184750139, + "learning_rate": 3.954154727793696e-07, + "loss": 0.8701926231384277, + "step": 415 + }, + { + "epoch": 0.01203714318468417, + "grad_norm": 105.14629416142066, + "learning_rate": 4.001910219675262e-07, + "loss": 0.8793960571289062, + "step": 420 + }, + { + "epoch": 0.012180442508311361, + "grad_norm": 57.07692452691585, + "learning_rate": 4.0496657115568286e-07, + "loss": 0.798529863357544, + "step": 425 + }, + { + "epoch": 0.012323741831938554, + "grad_norm": 58.06041883295279, + "learning_rate": 4.0974212034383955e-07, + "loss": 0.8588464736938477, + "step": 430 + }, + { + "epoch": 0.012467041155565746, + "grad_norm": 120.85895407683293, + "learning_rate": 4.145176695319962e-07, + "loss": 0.8535245895385742, + "step": 435 + }, + { + "epoch": 0.012610340479192938, + "grad_norm": 69.78052728059644, + "learning_rate": 4.192932187201528e-07, + "loss": 0.870508861541748, + "step": 440 + }, + { + "epoch": 0.01275363980282013, + "grad_norm": 80.95992426277672, + "learning_rate": 4.240687679083094e-07, + "loss": 0.8594521522521973, + "step": 445 + }, + { + "epoch": 0.012896939126447323, + "grad_norm": 63.10957991425338, + "learning_rate": 4.2884431709646605e-07, + "loss": 0.8154410362243653, + "step": 450 + }, + { + "epoch": 0.013040238450074515, + "grad_norm": 67.56654758418644, + "learning_rate": 4.336198662846227e-07, + "loss": 0.7830872058868408, + "step": 455 + }, + { + "epoch": 0.013183537773701709, + "grad_norm": 65.20991286823205, + "learning_rate": 4.383954154727794e-07, + "loss": 0.8680972099304199, + "step": 460 + }, + { + "epoch": 0.013326837097328901, + "grad_norm": 50.89289092397765, + "learning_rate": 4.43170964660936e-07, + "loss": 0.8447091102600097, + "step": 465 + }, + { + "epoch": 0.013470136420956094, + "grad_norm": 52.607139515409564, + "learning_rate": 4.479465138490926e-07, + "loss": 0.8408245086669922, + "step": 470 + }, + { + "epoch": 0.013613435744583286, + "grad_norm": 51.38814380019669, + "learning_rate": 4.5272206303724924e-07, + "loss": 0.7987042427062988, + "step": 475 + }, + { + "epoch": 0.013756735068210478, + "grad_norm": 51.92115077259463, + "learning_rate": 4.574976122254059e-07, + "loss": 0.882794189453125, + "step": 480 + }, + { + "epoch": 0.01390003439183767, + "grad_norm": 50.62852722842443, + "learning_rate": 4.622731614135625e-07, + "loss": 0.7965161323547363, + "step": 485 + }, + { + "epoch": 0.014043333715464863, + "grad_norm": 63.61565902973772, + "learning_rate": 4.670487106017192e-07, + "loss": 0.7446679592132568, + "step": 490 + }, + { + "epoch": 0.014186633039092055, + "grad_norm": 110.49200142955499, + "learning_rate": 4.7182425978987584e-07, + "loss": 0.798860740661621, + "step": 495 + }, + { + "epoch": 0.014329932362719249, + "grad_norm": 55.21597443276797, + "learning_rate": 4.7659980897803243e-07, + "loss": 0.7925246238708497, + "step": 500 + }, + { + "epoch": 0.014473231686346441, + "grad_norm": 59.31338371494678, + "learning_rate": 4.813753581661891e-07, + "loss": 0.8457393646240234, + "step": 505 + }, + { + "epoch": 0.014616531009973633, + "grad_norm": 77.3888982547293, + "learning_rate": 4.861509073543458e-07, + "loss": 0.7869475364685059, + "step": 510 + }, + { + "epoch": 0.014759830333600826, + "grad_norm": 90.74736530347278, + "learning_rate": 4.909264565425023e-07, + "loss": 0.8398687362670898, + "step": 515 + }, + { + "epoch": 0.014903129657228018, + "grad_norm": 51.458344555092886, + "learning_rate": 4.95702005730659e-07, + "loss": 0.733098030090332, + "step": 520 + }, + { + "epoch": 0.01504642898085521, + "grad_norm": 69.1859065334128, + "learning_rate": 5.004775549188156e-07, + "loss": 0.7724692344665527, + "step": 525 + }, + { + "epoch": 0.015189728304482402, + "grad_norm": 79.91397519513876, + "learning_rate": 5.052531041069723e-07, + "loss": 0.7552727222442627, + "step": 530 + }, + { + "epoch": 0.015333027628109595, + "grad_norm": 58.153906888190434, + "learning_rate": 5.100286532951289e-07, + "loss": 0.7707069873809814, + "step": 535 + }, + { + "epoch": 0.015476326951736789, + "grad_norm": 42.05524638723864, + "learning_rate": 5.148042024832856e-07, + "loss": 0.8209079742431641, + "step": 540 + }, + { + "epoch": 0.015619626275363981, + "grad_norm": 46.648965196761914, + "learning_rate": 5.195797516714422e-07, + "loss": 0.7787683486938477, + "step": 545 + }, + { + "epoch": 0.015762925598991173, + "grad_norm": 124.24898383402756, + "learning_rate": 5.243553008595987e-07, + "loss": 0.7473275184631347, + "step": 550 + }, + { + "epoch": 0.015906224922618364, + "grad_norm": 55.84236240605164, + "learning_rate": 5.291308500477554e-07, + "loss": 0.7558280944824218, + "step": 555 + }, + { + "epoch": 0.016049524246245558, + "grad_norm": 61.992971083730424, + "learning_rate": 5.33906399235912e-07, + "loss": 0.6905023574829101, + "step": 560 + }, + { + "epoch": 0.01619282356987275, + "grad_norm": 47.25305177335136, + "learning_rate": 5.386819484240688e-07, + "loss": 0.7630768299102784, + "step": 565 + }, + { + "epoch": 0.016336122893499942, + "grad_norm": 80.86653773794455, + "learning_rate": 5.434574976122254e-07, + "loss": 0.7431544303894043, + "step": 570 + }, + { + "epoch": 0.016479422217127136, + "grad_norm": 81.94020040391712, + "learning_rate": 5.482330468003821e-07, + "loss": 0.7615414619445801, + "step": 575 + }, + { + "epoch": 0.016622721540754327, + "grad_norm": 56.642441724123906, + "learning_rate": 5.530085959885387e-07, + "loss": 0.7639039993286133, + "step": 580 + }, + { + "epoch": 0.01676602086438152, + "grad_norm": 72.30430129067621, + "learning_rate": 5.577841451766953e-07, + "loss": 0.7447667598724366, + "step": 585 + }, + { + "epoch": 0.01690932018800871, + "grad_norm": 88.77644445347704, + "learning_rate": 5.62559694364852e-07, + "loss": 0.7262200355529785, + "step": 590 + }, + { + "epoch": 0.017052619511635905, + "grad_norm": 64.48960705543927, + "learning_rate": 5.673352435530085e-07, + "loss": 0.7450263977050782, + "step": 595 + }, + { + "epoch": 0.0171959188352631, + "grad_norm": 70.5551482506562, + "learning_rate": 5.721107927411652e-07, + "loss": 0.7429435729980469, + "step": 600 + }, + { + "epoch": 0.0171959188352631, + "eval_bfov_iou": 0.1641713707945324, + "eval_bfov_iou@0.1": 0.548, + "eval_bfov_iou@0.25": 0.256, + "eval_bfov_iou@0.5": 0.064, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.31257142857142856, + "eval_exact_match": 0.2415, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 350.95, + "eval_samples_per_second": 5.699, + "eval_steps_per_second": 0.18, + "eval_task_acc_absolute_direction_mc": 0.256, + "eval_task_acc_camera_rotation_transform_mc": 0.216, + "eval_task_acc_object_conditioned_reorientation_mc": 0.208, + "eval_task_acc_observer_distance_choice": 0.464, + "eval_task_acc_relative_3d_position_mc": 0.348, + "eval_task_acc_relative_direction_mc": 0.284, + "eval_task_acc_seam_continuity_mc": 0.412, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.548, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.256, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.064, + "eval_task_bfov_iou_referring_grounding_bfov": 0.1641713707945324, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 600 + }, + { + "epoch": 0.01733921815889029, + "grad_norm": 69.88618119492456, + "learning_rate": 5.768863419293218e-07, + "loss": 0.7494655132293702, + "step": 605 + }, + { + "epoch": 0.017482517482517484, + "grad_norm": 55.849153241828986, + "learning_rate": 5.816618911174784e-07, + "loss": 0.7436990737915039, + "step": 610 + }, + { + "epoch": 0.017625816806144674, + "grad_norm": 58.85527402273844, + "learning_rate": 5.864374403056351e-07, + "loss": 0.7933513641357421, + "step": 615 + }, + { + "epoch": 0.01776911612977187, + "grad_norm": 48.92127278191289, + "learning_rate": 5.912129894937917e-07, + "loss": 0.7597901344299316, + "step": 620 + }, + { + "epoch": 0.01791241545339906, + "grad_norm": 43.492399822187785, + "learning_rate": 5.959885386819485e-07, + "loss": 0.7399725437164306, + "step": 625 + }, + { + "epoch": 0.018055714777026253, + "grad_norm": 46.787555466647206, + "learning_rate": 6.007640878701051e-07, + "loss": 0.7300666809082031, + "step": 630 + }, + { + "epoch": 0.018199014100653443, + "grad_norm": 46.54313358359434, + "learning_rate": 6.055396370582617e-07, + "loss": 0.7097491264343262, + "step": 635 + }, + { + "epoch": 0.018342313424280637, + "grad_norm": 43.61961178402363, + "learning_rate": 6.103151862464183e-07, + "loss": 0.7051525115966797, + "step": 640 + }, + { + "epoch": 0.01848561274790783, + "grad_norm": 37.851237656051474, + "learning_rate": 6.150907354345749e-07, + "loss": 0.7367287635803222, + "step": 645 + }, + { + "epoch": 0.018628912071535022, + "grad_norm": 50.74060991160376, + "learning_rate": 6.198662846227316e-07, + "loss": 0.7176387786865235, + "step": 650 + }, + { + "epoch": 0.018772211395162216, + "grad_norm": 59.401365852857396, + "learning_rate": 6.246418338108882e-07, + "loss": 0.665212345123291, + "step": 655 + }, + { + "epoch": 0.018915510718789406, + "grad_norm": 49.39819049695024, + "learning_rate": 6.294173829990449e-07, + "loss": 0.7215981006622314, + "step": 660 + }, + { + "epoch": 0.0190588100424166, + "grad_norm": 45.60400062773623, + "learning_rate": 6.341929321872015e-07, + "loss": 0.709835433959961, + "step": 665 + }, + { + "epoch": 0.01920210936604379, + "grad_norm": 62.161234369637455, + "learning_rate": 6.389684813753582e-07, + "loss": 0.7342443466186523, + "step": 670 + }, + { + "epoch": 0.019345408689670985, + "grad_norm": 158.05160027183524, + "learning_rate": 6.437440305635147e-07, + "loss": 0.6643121719360352, + "step": 675 + }, + { + "epoch": 0.01948870801329818, + "grad_norm": 82.40723560418456, + "learning_rate": 6.485195797516713e-07, + "loss": 0.7029075622558594, + "step": 680 + }, + { + "epoch": 0.01963200733692537, + "grad_norm": 48.79366277509127, + "learning_rate": 6.532951289398281e-07, + "loss": 0.6588919639587403, + "step": 685 + }, + { + "epoch": 0.019775306660552563, + "grad_norm": 41.83717656255096, + "learning_rate": 6.580706781279847e-07, + "loss": 0.6964421749114991, + "step": 690 + }, + { + "epoch": 0.019918605984179754, + "grad_norm": 72.77043468965273, + "learning_rate": 6.628462273161414e-07, + "loss": 0.7852114677429199, + "step": 695 + }, + { + "epoch": 0.020061905307806948, + "grad_norm": 59.631871950746216, + "learning_rate": 6.67621776504298e-07, + "loss": 0.68681640625, + "step": 700 + }, + { + "epoch": 0.02020520463143414, + "grad_norm": 42.831187695579025, + "learning_rate": 6.723973256924546e-07, + "loss": 0.6987085342407227, + "step": 705 + }, + { + "epoch": 0.020348503955061333, + "grad_norm": 70.37143739470748, + "learning_rate": 6.771728748806113e-07, + "loss": 0.7043006420135498, + "step": 710 + }, + { + "epoch": 0.020491803278688523, + "grad_norm": 54.648618285050034, + "learning_rate": 6.819484240687678e-07, + "loss": 0.7310835838317871, + "step": 715 + }, + { + "epoch": 0.020635102602315717, + "grad_norm": 42.99014659906376, + "learning_rate": 6.867239732569245e-07, + "loss": 0.7152865409851075, + "step": 720 + }, + { + "epoch": 0.02077840192594291, + "grad_norm": 367.37998607015805, + "learning_rate": 6.914995224450811e-07, + "loss": 0.7284920692443848, + "step": 725 + }, + { + "epoch": 0.0209217012495701, + "grad_norm": 41.20857720520815, + "learning_rate": 6.962750716332378e-07, + "loss": 0.7173601150512695, + "step": 730 + }, + { + "epoch": 0.021065000573197296, + "grad_norm": 170.5579575483643, + "learning_rate": 7.010506208213944e-07, + "loss": 0.7092022895812988, + "step": 735 + }, + { + "epoch": 0.021208299896824486, + "grad_norm": 59.47688283569958, + "learning_rate": 7.05826170009551e-07, + "loss": 0.6626760959625244, + "step": 740 + }, + { + "epoch": 0.02135159922045168, + "grad_norm": 58.09863740267791, + "learning_rate": 7.106017191977078e-07, + "loss": 0.6575709342956543, + "step": 745 + }, + { + "epoch": 0.02149489854407887, + "grad_norm": 37.66092093338327, + "learning_rate": 7.153772683858644e-07, + "loss": 0.6713469505310059, + "step": 750 + }, + { + "epoch": 0.021638197867706065, + "grad_norm": 113.99120682824284, + "learning_rate": 7.20152817574021e-07, + "loss": 0.6624601364135743, + "step": 755 + }, + { + "epoch": 0.02178149719133326, + "grad_norm": 45.73730372319481, + "learning_rate": 7.249283667621776e-07, + "loss": 0.6718687057495117, + "step": 760 + }, + { + "epoch": 0.02192479651496045, + "grad_norm": 65.2090749282473, + "learning_rate": 7.297039159503342e-07, + "loss": 0.6731954574584961, + "step": 765 + }, + { + "epoch": 0.022068095838587643, + "grad_norm": 61.13810857228689, + "learning_rate": 7.344794651384909e-07, + "loss": 0.7001504898071289, + "step": 770 + }, + { + "epoch": 0.022211395162214834, + "grad_norm": 63.41943774276451, + "learning_rate": 7.392550143266475e-07, + "loss": 0.6852007865905761, + "step": 775 + }, + { + "epoch": 0.022354694485842028, + "grad_norm": 51.52982153313849, + "learning_rate": 7.440305635148042e-07, + "loss": 0.6658273696899414, + "step": 780 + }, + { + "epoch": 0.022497993809469218, + "grad_norm": 32.085580188873706, + "learning_rate": 7.488061127029608e-07, + "loss": 0.6417601585388184, + "step": 785 + }, + { + "epoch": 0.022641293133096412, + "grad_norm": 40.31080492895426, + "learning_rate": 7.535816618911175e-07, + "loss": 0.6568415641784668, + "step": 790 + }, + { + "epoch": 0.022784592456723603, + "grad_norm": 53.85520264647804, + "learning_rate": 7.58357211079274e-07, + "loss": 0.6954258918762207, + "step": 795 + }, + { + "epoch": 0.022927891780350797, + "grad_norm": 60.55353833241159, + "learning_rate": 7.631327602674306e-07, + "loss": 0.627980089187622, + "step": 800 + }, + { + "epoch": 0.02307119110397799, + "grad_norm": 53.70911376219644, + "learning_rate": 7.679083094555874e-07, + "loss": 0.6944860458374024, + "step": 805 + }, + { + "epoch": 0.02321449042760518, + "grad_norm": 45.99366473170338, + "learning_rate": 7.72683858643744e-07, + "loss": 0.7208085060119629, + "step": 810 + }, + { + "epoch": 0.023357789751232375, + "grad_norm": 39.122171682278285, + "learning_rate": 7.774594078319007e-07, + "loss": 0.6834659576416016, + "step": 815 + }, + { + "epoch": 0.023501089074859566, + "grad_norm": 39.74309372836488, + "learning_rate": 7.822349570200573e-07, + "loss": 0.6755227088928223, + "step": 820 + }, + { + "epoch": 0.02364438839848676, + "grad_norm": 65.0698749350878, + "learning_rate": 7.870105062082139e-07, + "loss": 0.6760683536529541, + "step": 825 + }, + { + "epoch": 0.02378768772211395, + "grad_norm": 75.52605835172653, + "learning_rate": 7.917860553963706e-07, + "loss": 0.6983874320983887, + "step": 830 + }, + { + "epoch": 0.023930987045741144, + "grad_norm": 55.65677775273731, + "learning_rate": 7.965616045845271e-07, + "loss": 0.6500906944274902, + "step": 835 + }, + { + "epoch": 0.02407428636936834, + "grad_norm": 39.607058631335654, + "learning_rate": 8.013371537726838e-07, + "loss": 0.6443074703216553, + "step": 840 + }, + { + "epoch": 0.02421758569299553, + "grad_norm": 39.585039057895955, + "learning_rate": 8.061127029608404e-07, + "loss": 0.7023961067199707, + "step": 845 + }, + { + "epoch": 0.024360885016622723, + "grad_norm": 56.6243804879083, + "learning_rate": 8.108882521489971e-07, + "loss": 0.6507768154144287, + "step": 850 + }, + { + "epoch": 0.024504184340249913, + "grad_norm": 91.99560296456713, + "learning_rate": 8.156638013371537e-07, + "loss": 0.6960889816284179, + "step": 855 + }, + { + "epoch": 0.024647483663877107, + "grad_norm": 64.13818228913684, + "learning_rate": 8.204393505253103e-07, + "loss": 0.6694812297821044, + "step": 860 + }, + { + "epoch": 0.024790782987504298, + "grad_norm": 84.53337605128041, + "learning_rate": 8.252148997134671e-07, + "loss": 0.656067943572998, + "step": 865 + }, + { + "epoch": 0.024934082311131492, + "grad_norm": 70.67007834975739, + "learning_rate": 8.299904489016237e-07, + "loss": 0.6631243705749512, + "step": 870 + }, + { + "epoch": 0.025077381634758682, + "grad_norm": 33.79573199554692, + "learning_rate": 8.347659980897803e-07, + "loss": 0.6011233806610108, + "step": 875 + }, + { + "epoch": 0.025220680958385876, + "grad_norm": 46.24054836680697, + "learning_rate": 8.395415472779369e-07, + "loss": 0.6431049346923828, + "step": 880 + }, + { + "epoch": 0.02536398028201307, + "grad_norm": 32.887992712799154, + "learning_rate": 8.443170964660936e-07, + "loss": 0.6408469200134277, + "step": 885 + }, + { + "epoch": 0.02550727960564026, + "grad_norm": 27.81268911157461, + "learning_rate": 8.490926456542502e-07, + "loss": 0.6611164093017579, + "step": 890 + }, + { + "epoch": 0.025650578929267455, + "grad_norm": 71.69713139188882, + "learning_rate": 8.538681948424068e-07, + "loss": 0.6391455173492432, + "step": 895 + }, + { + "epoch": 0.025793878252894645, + "grad_norm": 60.997385164544866, + "learning_rate": 8.586437440305635e-07, + "loss": 0.6503280162811279, + "step": 900 + }, + { + "epoch": 0.025793878252894645, + "eval_bfov_iou": 0.4558129583692029, + "eval_bfov_iou@0.1": 0.912, + "eval_bfov_iou@0.25": 0.812, + "eval_bfov_iou@0.5": 0.452, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.3365714285714286, + "eval_exact_match": 0.243, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 369.3927, + "eval_samples_per_second": 5.414, + "eval_steps_per_second": 0.171, + "eval_task_acc_absolute_direction_mc": 0.3, + "eval_task_acc_camera_rotation_transform_mc": 0.172, + "eval_task_acc_object_conditioned_reorientation_mc": 0.208, + "eval_task_acc_observer_distance_choice": 0.54, + "eval_task_acc_relative_3d_position_mc": 0.42, + "eval_task_acc_relative_direction_mc": 0.276, + "eval_task_acc_seam_continuity_mc": 0.44, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.912, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.812, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.452, + "eval_task_bfov_iou_referring_grounding_bfov": 0.4558129583692029, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 900 + }, + { + "epoch": 0.02593717757652184, + "grad_norm": 56.480748571740996, + "learning_rate": 8.634192932187201e-07, + "loss": 0.6170445442199707, + "step": 905 + }, + { + "epoch": 0.02608047690014903, + "grad_norm": 67.71363156698493, + "learning_rate": 8.681948424068768e-07, + "loss": 0.7073025703430176, + "step": 910 + }, + { + "epoch": 0.026223776223776224, + "grad_norm": 57.74442984746083, + "learning_rate": 8.729703915950333e-07, + "loss": 0.6540967941284179, + "step": 915 + }, + { + "epoch": 0.026367075547403418, + "grad_norm": 45.52746612869743, + "learning_rate": 8.777459407831899e-07, + "loss": 0.6971283912658691, + "step": 920 + }, + { + "epoch": 0.02651037487103061, + "grad_norm": 39.51419300132075, + "learning_rate": 8.825214899713467e-07, + "loss": 0.6234081268310547, + "step": 925 + }, + { + "epoch": 0.026653674194657802, + "grad_norm": 85.3450891010822, + "learning_rate": 8.872970391595033e-07, + "loss": 0.596715259552002, + "step": 930 + }, + { + "epoch": 0.026796973518284993, + "grad_norm": 28.41240728227779, + "learning_rate": 8.9207258834766e-07, + "loss": 0.6642153263092041, + "step": 935 + }, + { + "epoch": 0.026940272841912187, + "grad_norm": 66.64217116833441, + "learning_rate": 8.968481375358166e-07, + "loss": 0.5892632484436036, + "step": 940 + }, + { + "epoch": 0.027083572165539378, + "grad_norm": 30.360930884450983, + "learning_rate": 9.016236867239733e-07, + "loss": 0.6081679344177247, + "step": 945 + }, + { + "epoch": 0.02722687148916657, + "grad_norm": 67.62166187604723, + "learning_rate": 9.063992359121299e-07, + "loss": 0.6434609889984131, + "step": 950 + }, + { + "epoch": 0.027370170812793762, + "grad_norm": 102.01742885592482, + "learning_rate": 9.111747851002864e-07, + "loss": 0.6533758163452148, + "step": 955 + }, + { + "epoch": 0.027513470136420956, + "grad_norm": 224.73654800202488, + "learning_rate": 9.159503342884431e-07, + "loss": 0.6353167533874512, + "step": 960 + }, + { + "epoch": 0.02765676946004815, + "grad_norm": 30.241621218656626, + "learning_rate": 9.207258834765997e-07, + "loss": 0.6277078628540039, + "step": 965 + }, + { + "epoch": 0.02780006878367534, + "grad_norm": 45.76936457396874, + "learning_rate": 9.255014326647564e-07, + "loss": 0.6722579956054687, + "step": 970 + }, + { + "epoch": 0.027943368107302535, + "grad_norm": 31.076271909224435, + "learning_rate": 9.30276981852913e-07, + "loss": 0.6344833374023438, + "step": 975 + }, + { + "epoch": 0.028086667430929725, + "grad_norm": 58.692989394973665, + "learning_rate": 9.350525310410696e-07, + "loss": 0.6422696113586426, + "step": 980 + }, + { + "epoch": 0.02822996675455692, + "grad_norm": 52.736925749812656, + "learning_rate": 9.398280802292264e-07, + "loss": 0.6317469596862793, + "step": 985 + }, + { + "epoch": 0.02837326607818411, + "grad_norm": 50.20605833812266, + "learning_rate": 9.44603629417383e-07, + "loss": 0.6544366836547851, + "step": 990 + }, + { + "epoch": 0.028516565401811304, + "grad_norm": 43.13088538434208, + "learning_rate": 9.493791786055396e-07, + "loss": 0.611246395111084, + "step": 995 + }, + { + "epoch": 0.028659864725438498, + "grad_norm": 39.2927192323527, + "learning_rate": 9.541547277936962e-07, + "loss": 0.6257678985595703, + "step": 1000 + }, + { + "epoch": 0.028803164049065688, + "grad_norm": 40.50206881691804, + "learning_rate": 9.589302769818528e-07, + "loss": 0.6232872009277344, + "step": 1005 + }, + { + "epoch": 0.028946463372692882, + "grad_norm": 35.83976992408765, + "learning_rate": 9.637058261700094e-07, + "loss": 0.6220196723937989, + "step": 1010 + }, + { + "epoch": 0.029089762696320073, + "grad_norm": 28.925157944158588, + "learning_rate": 9.684813753581662e-07, + "loss": 0.6185609817504882, + "step": 1015 + }, + { + "epoch": 0.029233062019947267, + "grad_norm": 34.78669555950643, + "learning_rate": 9.732569245463228e-07, + "loss": 0.7073936462402344, + "step": 1020 + }, + { + "epoch": 0.029376361343574457, + "grad_norm": 35.77460820802889, + "learning_rate": 9.780324737344794e-07, + "loss": 0.6411643981933594, + "step": 1025 + }, + { + "epoch": 0.02951966066720165, + "grad_norm": 305.1859951882744, + "learning_rate": 9.828080229226362e-07, + "loss": 0.6339746952056885, + "step": 1030 + }, + { + "epoch": 0.029662959990828842, + "grad_norm": 37.732835082937896, + "learning_rate": 9.875835721107928e-07, + "loss": 0.6380776405334473, + "step": 1035 + }, + { + "epoch": 0.029806259314456036, + "grad_norm": 39.40485036365009, + "learning_rate": 9.923591212989493e-07, + "loss": 0.6316628456115723, + "step": 1040 + }, + { + "epoch": 0.02994955863808323, + "grad_norm": 29.133675983264286, + "learning_rate": 9.97134670487106e-07, + "loss": 0.6149044036865234, + "step": 1045 + }, + { + "epoch": 0.03009285796171042, + "grad_norm": 38.094671113353215, + "learning_rate": 9.999999913839003e-07, + "loss": 0.600700855255127, + "step": 1050 + }, + { + "epoch": 0.030236157285337614, + "grad_norm": 77.11376613584996, + "learning_rate": 9.99999894452784e-07, + "loss": 0.6717242240905762, + "step": 1055 + }, + { + "epoch": 0.030379456608964805, + "grad_norm": 43.161173536246004, + "learning_rate": 9.99999689820448e-07, + "loss": 0.6150068283081055, + "step": 1060 + }, + { + "epoch": 0.030522755932592, + "grad_norm": 46.689495358393906, + "learning_rate": 9.99999377486936e-07, + "loss": 0.5671535491943359, + "step": 1065 + }, + { + "epoch": 0.03066605525621919, + "grad_norm": 60.13726472491902, + "learning_rate": 9.999989574523157e-07, + "loss": 0.665403938293457, + "step": 1070 + }, + { + "epoch": 0.030809354579846383, + "grad_norm": 66.0709782877259, + "learning_rate": 9.999984297166774e-07, + "loss": 0.5937241554260254, + "step": 1075 + }, + { + "epoch": 0.030952653903473577, + "grad_norm": 48.73325924250786, + "learning_rate": 9.99997794280135e-07, + "loss": 0.6143194198608398, + "step": 1080 + }, + { + "epoch": 0.031095953227100768, + "grad_norm": 53.15127172049473, + "learning_rate": 9.99997051142825e-07, + "loss": 0.5942808628082276, + "step": 1085 + }, + { + "epoch": 0.031239252550727962, + "grad_norm": 36.5314685625137, + "learning_rate": 9.999962003049077e-07, + "loss": 0.6289074420928955, + "step": 1090 + }, + { + "epoch": 0.03138255187435515, + "grad_norm": 83.39015481488379, + "learning_rate": 9.999952417665662e-07, + "loss": 0.6139866352081299, + "step": 1095 + }, + { + "epoch": 0.031525851197982346, + "grad_norm": 50.7607777368368, + "learning_rate": 9.999941755280072e-07, + "loss": 0.6560574054718018, + "step": 1100 + }, + { + "epoch": 0.03166915052160954, + "grad_norm": 34.19951483692593, + "learning_rate": 9.999930015894603e-07, + "loss": 0.6535513877868653, + "step": 1105 + }, + { + "epoch": 0.03181244984523673, + "grad_norm": 31.219708898172634, + "learning_rate": 9.999917199511783e-07, + "loss": 0.594221544265747, + "step": 1110 + }, + { + "epoch": 0.03195574916886392, + "grad_norm": 27.68625015365757, + "learning_rate": 9.999903306134372e-07, + "loss": 0.603395652770996, + "step": 1115 + }, + { + "epoch": 0.032099048492491115, + "grad_norm": 155.47849674093044, + "learning_rate": 9.999888335765366e-07, + "loss": 0.6014899253845215, + "step": 1120 + }, + { + "epoch": 0.03224234781611831, + "grad_norm": 76.24662984086913, + "learning_rate": 9.999872288407984e-07, + "loss": 0.6358906269073487, + "step": 1125 + }, + { + "epoch": 0.0323856471397455, + "grad_norm": 63.91069699821094, + "learning_rate": 9.99985516406569e-07, + "loss": 0.6691648960113525, + "step": 1130 + }, + { + "epoch": 0.03252894646337269, + "grad_norm": 32.44081143020695, + "learning_rate": 9.999836962742164e-07, + "loss": 0.5922126770019531, + "step": 1135 + }, + { + "epoch": 0.032672245786999884, + "grad_norm": 27.403693687225495, + "learning_rate": 9.999817684441336e-07, + "loss": 0.6368430614471435, + "step": 1140 + }, + { + "epoch": 0.03281554511062708, + "grad_norm": 50.95610682564922, + "learning_rate": 9.999797329167352e-07, + "loss": 0.6267875671386719, + "step": 1145 + }, + { + "epoch": 0.03295884443425427, + "grad_norm": 24.043545501438945, + "learning_rate": 9.999775896924599e-07, + "loss": 0.604363489151001, + "step": 1150 + }, + { + "epoch": 0.03310214375788146, + "grad_norm": 34.39148240872561, + "learning_rate": 9.99975338771769e-07, + "loss": 0.6185234069824219, + "step": 1155 + }, + { + "epoch": 0.033245443081508654, + "grad_norm": 31.02551101385872, + "learning_rate": 9.99972980155148e-07, + "loss": 0.6567314624786377, + "step": 1160 + }, + { + "epoch": 0.03338874240513585, + "grad_norm": 78.59402312088163, + "learning_rate": 9.999705138431044e-07, + "loss": 0.6364608764648437, + "step": 1165 + }, + { + "epoch": 0.03353204172876304, + "grad_norm": 36.66254892141864, + "learning_rate": 9.999679398361698e-07, + "loss": 0.5971811771392822, + "step": 1170 + }, + { + "epoch": 0.033675341052390236, + "grad_norm": 55.66005357450158, + "learning_rate": 9.999652581348986e-07, + "loss": 0.5670675277709961, + "step": 1175 + }, + { + "epoch": 0.03381864037601742, + "grad_norm": 36.44754264988773, + "learning_rate": 9.999624687398682e-07, + "loss": 0.6223600387573243, + "step": 1180 + }, + { + "epoch": 0.03396193969964462, + "grad_norm": 22.76944115556631, + "learning_rate": 9.999595716516796e-07, + "loss": 0.5807863712310791, + "step": 1185 + }, + { + "epoch": 0.03410523902327181, + "grad_norm": 244.55346476655757, + "learning_rate": 9.999565668709567e-07, + "loss": 0.6180659770965576, + "step": 1190 + }, + { + "epoch": 0.034248538346899005, + "grad_norm": 60.63970909266819, + "learning_rate": 9.99953454398347e-07, + "loss": 0.5860499382019043, + "step": 1195 + }, + { + "epoch": 0.0343918376705262, + "grad_norm": 39.383797355890714, + "learning_rate": 9.999502342345208e-07, + "loss": 0.5816361904144287, + "step": 1200 + }, + { + "epoch": 0.0343918376705262, + "eval_bfov_iou": 0.5854360651848624, + "eval_bfov_iou@0.1": 0.932, + "eval_bfov_iou@0.25": 0.88, + "eval_bfov_iou@0.5": 0.764, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.38, + "eval_exact_match": 0.285, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 354.7596, + "eval_samples_per_second": 5.638, + "eval_steps_per_second": 0.178, + "eval_task_acc_absolute_direction_mc": 0.444, + "eval_task_acc_camera_rotation_transform_mc": 0.192, + "eval_task_acc_object_conditioned_reorientation_mc": 0.208, + "eval_task_acc_observer_distance_choice": 0.556, + "eval_task_acc_relative_3d_position_mc": 0.484, + "eval_task_acc_relative_direction_mc": 0.3, + "eval_task_acc_seam_continuity_mc": 0.476, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.932, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.88, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.764, + "eval_task_bfov_iou_referring_grounding_bfov": 0.5854360651848624, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 1200 + }, + { + "epoch": 0.034535136994153386, + "grad_norm": 33.67437103532786, + "learning_rate": 9.999469063801717e-07, + "loss": 0.6367865562438965, + "step": 1205 + }, + { + "epoch": 0.03467843631778058, + "grad_norm": 38.967198035695745, + "learning_rate": 9.999434708360165e-07, + "loss": 0.5941066741943359, + "step": 1210 + }, + { + "epoch": 0.034821735641407774, + "grad_norm": 54.46787924110775, + "learning_rate": 9.999399276027953e-07, + "loss": 0.6401958465576172, + "step": 1215 + }, + { + "epoch": 0.03496503496503497, + "grad_norm": 22.705874563794737, + "learning_rate": 9.999362766812714e-07, + "loss": 0.5899722099304199, + "step": 1220 + }, + { + "epoch": 0.035108334288662155, + "grad_norm": 63.13333366895842, + "learning_rate": 9.999325180722311e-07, + "loss": 0.6191739082336426, + "step": 1225 + }, + { + "epoch": 0.03525163361228935, + "grad_norm": 49.67022099850108, + "learning_rate": 9.99928651776484e-07, + "loss": 0.6060976028442383, + "step": 1230 + }, + { + "epoch": 0.03539493293591654, + "grad_norm": 38.54317846096031, + "learning_rate": 9.99924677794863e-07, + "loss": 0.5866519927978515, + "step": 1235 + }, + { + "epoch": 0.03553823225954374, + "grad_norm": 42.194505865580645, + "learning_rate": 9.99920596128224e-07, + "loss": 0.6130558013916015, + "step": 1240 + }, + { + "epoch": 0.03568153158317093, + "grad_norm": 84.30115485746165, + "learning_rate": 9.999164067774462e-07, + "loss": 0.6192620277404786, + "step": 1245 + }, + { + "epoch": 0.03582483090679812, + "grad_norm": 40.60356406555794, + "learning_rate": 9.999121097434323e-07, + "loss": 0.5833636283874511, + "step": 1250 + }, + { + "epoch": 0.03596813023042531, + "grad_norm": 30.46650831613495, + "learning_rate": 9.999077050271074e-07, + "loss": 0.6079329490661621, + "step": 1255 + }, + { + "epoch": 0.036111429554052506, + "grad_norm": 32.18612999686701, + "learning_rate": 9.999031926294205e-07, + "loss": 0.6126091003417968, + "step": 1260 + }, + { + "epoch": 0.0362547288776797, + "grad_norm": 261.82717776085633, + "learning_rate": 9.998985725513438e-07, + "loss": 0.5822365760803223, + "step": 1265 + }, + { + "epoch": 0.03639802820130689, + "grad_norm": 33.90250839449857, + "learning_rate": 9.998938447938722e-07, + "loss": 0.5947070598602295, + "step": 1270 + }, + { + "epoch": 0.03654132752493408, + "grad_norm": 35.167595429615524, + "learning_rate": 9.99889009358024e-07, + "loss": 0.5951919555664062, + "step": 1275 + }, + { + "epoch": 0.036684626848561275, + "grad_norm": 56.30545928573922, + "learning_rate": 9.998840662448412e-07, + "loss": 0.5460718154907227, + "step": 1280 + }, + { + "epoch": 0.03682792617218847, + "grad_norm": 35.06154990067864, + "learning_rate": 9.998790154553882e-07, + "loss": 0.6114240646362304, + "step": 1285 + }, + { + "epoch": 0.03697122549581566, + "grad_norm": 58.3664091576006, + "learning_rate": 9.99873856990753e-07, + "loss": 0.5942163944244385, + "step": 1290 + }, + { + "epoch": 0.03711452481944285, + "grad_norm": 24.819406439888965, + "learning_rate": 9.998685908520467e-07, + "loss": 0.6213590145111084, + "step": 1295 + }, + { + "epoch": 0.037257824143070044, + "grad_norm": 45.42024852976097, + "learning_rate": 9.998632170404037e-07, + "loss": 0.6203494071960449, + "step": 1300 + }, + { + "epoch": 0.03740112346669724, + "grad_norm": 23.163303955306183, + "learning_rate": 9.998577355569818e-07, + "loss": 0.605250072479248, + "step": 1305 + }, + { + "epoch": 0.03754442279032443, + "grad_norm": 30.341203949072526, + "learning_rate": 9.998521464029613e-07, + "loss": 0.5750216484069824, + "step": 1310 + }, + { + "epoch": 0.03768772211395162, + "grad_norm": 24.22863971152501, + "learning_rate": 9.998464495795463e-07, + "loss": 0.5924405097961426, + "step": 1315 + }, + { + "epoch": 0.03783102143757881, + "grad_norm": 23.985923501373843, + "learning_rate": 9.99840645087964e-07, + "loss": 0.5776487350463867, + "step": 1320 + }, + { + "epoch": 0.03797432076120601, + "grad_norm": 29.488532821511203, + "learning_rate": 9.998347329294644e-07, + "loss": 0.6147611618041993, + "step": 1325 + }, + { + "epoch": 0.0381176200848332, + "grad_norm": 34.47361717931853, + "learning_rate": 9.998287131053214e-07, + "loss": 0.592649269104004, + "step": 1330 + }, + { + "epoch": 0.038260919408460395, + "grad_norm": 36.709396153937604, + "learning_rate": 9.998225856168314e-07, + "loss": 0.6391838073730469, + "step": 1335 + }, + { + "epoch": 0.03840421873208758, + "grad_norm": 29.966284585927152, + "learning_rate": 9.998163504653143e-07, + "loss": 0.6167519569396973, + "step": 1340 + }, + { + "epoch": 0.038547518055714776, + "grad_norm": 37.04837924130978, + "learning_rate": 9.998100076521134e-07, + "loss": 0.58936767578125, + "step": 1345 + }, + { + "epoch": 0.03869081737934197, + "grad_norm": 208.81732598111353, + "learning_rate": 9.998035571785946e-07, + "loss": 0.5955070972442627, + "step": 1350 + }, + { + "epoch": 0.038834116702969164, + "grad_norm": 31.34797290557625, + "learning_rate": 9.997969990461476e-07, + "loss": 0.6031423091888428, + "step": 1355 + }, + { + "epoch": 0.03897741602659636, + "grad_norm": 60.842619475324945, + "learning_rate": 9.99790333256185e-07, + "loss": 0.6312102317810059, + "step": 1360 + }, + { + "epoch": 0.039120715350223545, + "grad_norm": 30.74252128303714, + "learning_rate": 9.997835598101427e-07, + "loss": 0.5923074722290039, + "step": 1365 + }, + { + "epoch": 0.03926401467385074, + "grad_norm": 42.37088311102261, + "learning_rate": 9.997766787094795e-07, + "loss": 0.6326573371887207, + "step": 1370 + }, + { + "epoch": 0.03940731399747793, + "grad_norm": 64.6245720648295, + "learning_rate": 9.997696899556778e-07, + "loss": 0.5803810596466065, + "step": 1375 + }, + { + "epoch": 0.03955061332110513, + "grad_norm": 36.99711857777534, + "learning_rate": 9.997625935502429e-07, + "loss": 0.5959180355072021, + "step": 1380 + }, + { + "epoch": 0.039693912644732314, + "grad_norm": 45.1342997501112, + "learning_rate": 9.997553894947032e-07, + "loss": 0.5451254844665527, + "step": 1385 + }, + { + "epoch": 0.03983721196835951, + "grad_norm": 32.85007141100058, + "learning_rate": 9.99748077790611e-07, + "loss": 0.6074098587036133, + "step": 1390 + }, + { + "epoch": 0.0399805112919867, + "grad_norm": 63.71681664796796, + "learning_rate": 9.997406584395407e-07, + "loss": 0.6080751419067383, + "step": 1395 + }, + { + "epoch": 0.040123810615613896, + "grad_norm": 35.356840297351766, + "learning_rate": 9.997331314430907e-07, + "loss": 0.6093258857727051, + "step": 1400 + }, + { + "epoch": 0.04026710993924109, + "grad_norm": 39.49406430472693, + "learning_rate": 9.997254968028823e-07, + "loss": 0.6182333469390869, + "step": 1405 + }, + { + "epoch": 0.04041040926286828, + "grad_norm": 26.218433884495607, + "learning_rate": 9.997177545205602e-07, + "loss": 0.5911032676696777, + "step": 1410 + }, + { + "epoch": 0.04055370858649547, + "grad_norm": 45.11612109674152, + "learning_rate": 9.997099045977919e-07, + "loss": 0.5831490993499756, + "step": 1415 + }, + { + "epoch": 0.040697007910122665, + "grad_norm": 23.15996972040751, + "learning_rate": 9.997019470362682e-07, + "loss": 0.5892763137817383, + "step": 1420 + }, + { + "epoch": 0.04084030723374986, + "grad_norm": 21.88351046287805, + "learning_rate": 9.996938818377034e-07, + "loss": 0.5655601501464844, + "step": 1425 + }, + { + "epoch": 0.040983606557377046, + "grad_norm": 25.928903194286434, + "learning_rate": 9.996857090038346e-07, + "loss": 0.5461457729339599, + "step": 1430 + }, + { + "epoch": 0.04112690588100424, + "grad_norm": 56.1355351777455, + "learning_rate": 9.996774285364224e-07, + "loss": 0.5756010055541992, + "step": 1435 + }, + { + "epoch": 0.041270205204631434, + "grad_norm": 25.8994375549613, + "learning_rate": 9.996690404372503e-07, + "loss": 0.6152217864990235, + "step": 1440 + }, + { + "epoch": 0.04141350452825863, + "grad_norm": 42.36102799568622, + "learning_rate": 9.996605447081252e-07, + "loss": 0.5622048377990723, + "step": 1445 + }, + { + "epoch": 0.04155680385188582, + "grad_norm": 63.8408591754104, + "learning_rate": 9.996519413508772e-07, + "loss": 0.6180083751678467, + "step": 1450 + }, + { + "epoch": 0.04170010317551301, + "grad_norm": 54.46394452081972, + "learning_rate": 9.996432303673593e-07, + "loss": 0.5874021053314209, + "step": 1455 + }, + { + "epoch": 0.0418434024991402, + "grad_norm": 17.945536992184202, + "learning_rate": 9.996344117594478e-07, + "loss": 0.6068024635314941, + "step": 1460 + }, + { + "epoch": 0.0419867018227674, + "grad_norm": 31.435845286197598, + "learning_rate": 9.996254855290425e-07, + "loss": 0.6077653884887695, + "step": 1465 + }, + { + "epoch": 0.04213000114639459, + "grad_norm": 31.725744430508396, + "learning_rate": 9.99616451678066e-07, + "loss": 0.5838251113891602, + "step": 1470 + }, + { + "epoch": 0.04227330047002178, + "grad_norm": 29.508100658982357, + "learning_rate": 9.99607310208464e-07, + "loss": 0.6357110023498536, + "step": 1475 + }, + { + "epoch": 0.04241659979364897, + "grad_norm": 35.701280215144706, + "learning_rate": 9.99598061122206e-07, + "loss": 0.5749570369720459, + "step": 1480 + }, + { + "epoch": 0.042559899117276166, + "grad_norm": 33.32237985040215, + "learning_rate": 9.995887044212841e-07, + "loss": 0.6117693424224854, + "step": 1485 + }, + { + "epoch": 0.04270319844090336, + "grad_norm": 44.42884078033862, + "learning_rate": 9.995792401077138e-07, + "loss": 0.6032561779022216, + "step": 1490 + }, + { + "epoch": 0.042846497764530554, + "grad_norm": 30.322691287639998, + "learning_rate": 9.995696681835336e-07, + "loss": 0.5930624961853027, + "step": 1495 + }, + { + "epoch": 0.04298979708815774, + "grad_norm": 26.938783902207696, + "learning_rate": 9.995599886508055e-07, + "loss": 0.6056136131286621, + "step": 1500 + }, + { + "epoch": 0.04298979708815774, + "eval_bfov_iou": 0.6015087404077688, + "eval_bfov_iou@0.1": 0.968, + "eval_bfov_iou@0.25": 0.944, + "eval_bfov_iou@0.5": 0.8, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.416, + "eval_exact_match": 0.3255, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 339.1307, + "eval_samples_per_second": 5.897, + "eval_steps_per_second": 0.186, + "eval_task_acc_absolute_direction_mc": 0.616, + "eval_task_acc_camera_rotation_transform_mc": 0.2, + "eval_task_acc_object_conditioned_reorientation_mc": 0.208, + "eval_task_acc_observer_distance_choice": 0.556, + "eval_task_acc_relative_3d_position_mc": 0.468, + "eval_task_acc_relative_direction_mc": 0.32, + "eval_task_acc_seam_continuity_mc": 0.544, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.968, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.944, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.8, + "eval_task_bfov_iou_referring_grounding_bfov": 0.6015087404077688, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 1500 + }, + { + "epoch": 0.043133096411784935, + "grad_norm": 23.643153961031878, + "learning_rate": 9.995502015116145e-07, + "loss": 0.6367388725280761, + "step": 1505 + }, + { + "epoch": 0.04327639573541213, + "grad_norm": 52.184306363578266, + "learning_rate": 9.995403067680685e-07, + "loss": 0.5734808444976807, + "step": 1510 + }, + { + "epoch": 0.04341969505903932, + "grad_norm": 32.423337519137405, + "learning_rate": 9.995303044222988e-07, + "loss": 0.6106406211853027, + "step": 1515 + }, + { + "epoch": 0.04356299438266652, + "grad_norm": 30.374605706197183, + "learning_rate": 9.995201944764606e-07, + "loss": 0.6255788803100586, + "step": 1520 + }, + { + "epoch": 0.043706293706293704, + "grad_norm": 23.53235140835768, + "learning_rate": 9.99509976932731e-07, + "loss": 0.5909383773803711, + "step": 1525 + }, + { + "epoch": 0.0438495930299209, + "grad_norm": 22.032174383854553, + "learning_rate": 9.99499651793311e-07, + "loss": 0.5890019416809082, + "step": 1530 + }, + { + "epoch": 0.04399289235354809, + "grad_norm": 24.487779311492307, + "learning_rate": 9.994892190604247e-07, + "loss": 0.6494297027587891, + "step": 1535 + }, + { + "epoch": 0.044136191677175286, + "grad_norm": 27.7855873896967, + "learning_rate": 9.994786787363195e-07, + "loss": 0.6185944557189942, + "step": 1540 + }, + { + "epoch": 0.04427949100080247, + "grad_norm": 20.42038587700261, + "learning_rate": 9.994680308232654e-07, + "loss": 0.6078923225402832, + "step": 1545 + }, + { + "epoch": 0.04442279032442967, + "grad_norm": 43.397836413198576, + "learning_rate": 9.994572753235565e-07, + "loss": 0.5752403259277343, + "step": 1550 + }, + { + "epoch": 0.04456608964805686, + "grad_norm": 24.950794841440405, + "learning_rate": 9.994464122395093e-07, + "loss": 0.6042813301086426, + "step": 1555 + }, + { + "epoch": 0.044709388971684055, + "grad_norm": 25.646188820323864, + "learning_rate": 9.994354415734636e-07, + "loss": 0.584356689453125, + "step": 1560 + }, + { + "epoch": 0.04485268829531125, + "grad_norm": 27.844923363321794, + "learning_rate": 9.994243633277826e-07, + "loss": 0.600314712524414, + "step": 1565 + }, + { + "epoch": 0.044995987618938436, + "grad_norm": 34.78124108861982, + "learning_rate": 9.994131775048526e-07, + "loss": 0.5709603786468506, + "step": 1570 + }, + { + "epoch": 0.04513928694256563, + "grad_norm": 78.44439317018825, + "learning_rate": 9.994018841070834e-07, + "loss": 0.5600241184234619, + "step": 1575 + }, + { + "epoch": 0.045282586266192824, + "grad_norm": 66.3180893659036, + "learning_rate": 9.99390483136907e-07, + "loss": 0.592997932434082, + "step": 1580 + }, + { + "epoch": 0.04542588558982002, + "grad_norm": 28.409480438779294, + "learning_rate": 9.993789745967795e-07, + "loss": 0.5626708030700683, + "step": 1585 + }, + { + "epoch": 0.045569184913447205, + "grad_norm": 26.045791057381752, + "learning_rate": 9.993673584891802e-07, + "loss": 0.5609834671020508, + "step": 1590 + }, + { + "epoch": 0.0457124842370744, + "grad_norm": 36.054983332528394, + "learning_rate": 9.993556348166106e-07, + "loss": 0.5574330806732177, + "step": 1595 + }, + { + "epoch": 0.04585578356070159, + "grad_norm": 44.37759113219577, + "learning_rate": 9.993438035815964e-07, + "loss": 0.6001670837402344, + "step": 1600 + }, + { + "epoch": 0.04599908288432879, + "grad_norm": 29.005603162563798, + "learning_rate": 9.993318647866862e-07, + "loss": 0.5817459106445313, + "step": 1605 + }, + { + "epoch": 0.04614238220795598, + "grad_norm": 34.140335777506216, + "learning_rate": 9.993198184344513e-07, + "loss": 0.5673059940338134, + "step": 1610 + }, + { + "epoch": 0.04628568153158317, + "grad_norm": 87.71685790238983, + "learning_rate": 9.993076645274866e-07, + "loss": 0.5751641273498536, + "step": 1615 + }, + { + "epoch": 0.04642898085521036, + "grad_norm": 33.544307766626275, + "learning_rate": 9.992954030684103e-07, + "loss": 0.5851795196533203, + "step": 1620 + }, + { + "epoch": 0.046572280178837556, + "grad_norm": 24.78681809462253, + "learning_rate": 9.992830340598632e-07, + "loss": 0.6028999805450439, + "step": 1625 + }, + { + "epoch": 0.04671557950246475, + "grad_norm": 32.06779329837463, + "learning_rate": 9.9927055750451e-07, + "loss": 0.5816215515136719, + "step": 1630 + }, + { + "epoch": 0.04685887882609194, + "grad_norm": 33.49753302294949, + "learning_rate": 9.992579734050378e-07, + "loss": 0.5678863525390625, + "step": 1635 + }, + { + "epoch": 0.04700217814971913, + "grad_norm": 19.13123016674288, + "learning_rate": 9.992452817641575e-07, + "loss": 0.5840871334075928, + "step": 1640 + }, + { + "epoch": 0.047145477473346326, + "grad_norm": 33.82656518531454, + "learning_rate": 9.992324825846029e-07, + "loss": 0.5632320880889893, + "step": 1645 + }, + { + "epoch": 0.04728877679697352, + "grad_norm": 30.389250664716748, + "learning_rate": 9.992195758691308e-07, + "loss": 0.5983625411987304, + "step": 1650 + }, + { + "epoch": 0.047432076120600714, + "grad_norm": 39.205942967524166, + "learning_rate": 9.992065616205216e-07, + "loss": 0.5459277153015136, + "step": 1655 + }, + { + "epoch": 0.0475753754442279, + "grad_norm": 41.972000096251094, + "learning_rate": 9.991934398415784e-07, + "loss": 0.6136983871459961, + "step": 1660 + }, + { + "epoch": 0.047718674767855095, + "grad_norm": 39.06140166469386, + "learning_rate": 9.991802105351278e-07, + "loss": 0.5938082695007324, + "step": 1665 + }, + { + "epoch": 0.04786197409148229, + "grad_norm": 68.20516887597034, + "learning_rate": 9.991668737040194e-07, + "loss": 0.561781930923462, + "step": 1670 + }, + { + "epoch": 0.04800527341510948, + "grad_norm": 26.718237010760216, + "learning_rate": 9.991534293511257e-07, + "loss": 0.6001361846923828, + "step": 1675 + }, + { + "epoch": 0.04814857273873668, + "grad_norm": 23.262713765887433, + "learning_rate": 9.99139877479343e-07, + "loss": 0.5955245971679688, + "step": 1680 + }, + { + "epoch": 0.048291872062363864, + "grad_norm": 37.3139533244484, + "learning_rate": 9.991262180915904e-07, + "loss": 0.5704999923706054, + "step": 1685 + }, + { + "epoch": 0.04843517138599106, + "grad_norm": 24.081467313740635, + "learning_rate": 9.9911245119081e-07, + "loss": 0.5713274002075195, + "step": 1690 + }, + { + "epoch": 0.04857847070961825, + "grad_norm": 35.66519136824683, + "learning_rate": 9.99098576779967e-07, + "loss": 0.5671302795410156, + "step": 1695 + }, + { + "epoch": 0.048721770033245446, + "grad_norm": 23.30178918444992, + "learning_rate": 9.990845948620507e-07, + "loss": 0.6049543857574463, + "step": 1700 + }, + { + "epoch": 0.04886506935687263, + "grad_norm": 22.612230552016154, + "learning_rate": 9.99070505440072e-07, + "loss": 0.6073174476623535, + "step": 1705 + }, + { + "epoch": 0.04900836868049983, + "grad_norm": 99.05154103041548, + "learning_rate": 9.990563085170666e-07, + "loss": 0.5396961212158203, + "step": 1710 + }, + { + "epoch": 0.04915166800412702, + "grad_norm": 22.501874585443748, + "learning_rate": 9.990420040960919e-07, + "loss": 0.5594051361083985, + "step": 1715 + }, + { + "epoch": 0.049294967327754215, + "grad_norm": 26.51783806089847, + "learning_rate": 9.990275921802296e-07, + "loss": 0.5928513526916503, + "step": 1720 + }, + { + "epoch": 0.04943826665138141, + "grad_norm": 29.47193299404527, + "learning_rate": 9.990130727725835e-07, + "loss": 0.5328378200531005, + "step": 1725 + }, + { + "epoch": 0.049581565975008596, + "grad_norm": 33.68054032239375, + "learning_rate": 9.989984458762817e-07, + "loss": 0.5530153751373291, + "step": 1730 + }, + { + "epoch": 0.04972486529863579, + "grad_norm": 28.55268860083561, + "learning_rate": 9.989837114944743e-07, + "loss": 0.5732487201690674, + "step": 1735 + }, + { + "epoch": 0.049868164622262984, + "grad_norm": 41.926487225114435, + "learning_rate": 9.989688696303358e-07, + "loss": 0.5572394847869873, + "step": 1740 + }, + { + "epoch": 0.05001146394589018, + "grad_norm": 34.13115012574196, + "learning_rate": 9.989539202870627e-07, + "loss": 0.5792385101318359, + "step": 1745 + }, + { + "epoch": 0.050154763269517365, + "grad_norm": 30.006476203903045, + "learning_rate": 9.98938863467875e-07, + "loss": 0.5460923194885254, + "step": 1750 + }, + { + "epoch": 0.05029806259314456, + "grad_norm": 40.4970350141582, + "learning_rate": 9.989236991760164e-07, + "loss": 0.5735946655273437, + "step": 1755 + }, + { + "epoch": 0.05044136191677175, + "grad_norm": 57.021593038540196, + "learning_rate": 9.989084274147531e-07, + "loss": 0.5447168350219727, + "step": 1760 + }, + { + "epoch": 0.05058466124039895, + "grad_norm": 31.553107041886026, + "learning_rate": 9.988930481873748e-07, + "loss": 0.5943060398101807, + "step": 1765 + }, + { + "epoch": 0.05072796056402614, + "grad_norm": 63.61173473562259, + "learning_rate": 9.98877561497194e-07, + "loss": 0.5713775157928467, + "step": 1770 + }, + { + "epoch": 0.05087125988765333, + "grad_norm": 24.16464680098391, + "learning_rate": 9.988619673475468e-07, + "loss": 0.582763671875, + "step": 1775 + }, + { + "epoch": 0.05101455921128052, + "grad_norm": 37.57718597887904, + "learning_rate": 9.988462657417922e-07, + "loss": 0.5432621002197265, + "step": 1780 + }, + { + "epoch": 0.051157858534907716, + "grad_norm": 33.69960464148644, + "learning_rate": 9.98830456683312e-07, + "loss": 0.5683144569396973, + "step": 1785 + }, + { + "epoch": 0.05130115785853491, + "grad_norm": 28.884443286885894, + "learning_rate": 9.98814540175512e-07, + "loss": 0.5499480724334717, + "step": 1790 + }, + { + "epoch": 0.0514444571821621, + "grad_norm": 22.34855795748037, + "learning_rate": 9.987985162218203e-07, + "loss": 0.5896708011627197, + "step": 1795 + }, + { + "epoch": 0.05158775650578929, + "grad_norm": 26.511925214510494, + "learning_rate": 9.98782384825689e-07, + "loss": 0.5368827819824219, + "step": 1800 + }, + { + "epoch": 0.05158775650578929, + "eval_bfov_iou": 0.6771139578068157, + "eval_bfov_iou@0.1": 0.964, + "eval_bfov_iou@0.25": 0.956, + "eval_bfov_iou@0.5": 0.924, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.4542857142857143, + "eval_exact_match": 0.352, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 341.9579, + "eval_samples_per_second": 5.849, + "eval_steps_per_second": 0.184, + "eval_task_acc_absolute_direction_mc": 0.708, + "eval_task_acc_camera_rotation_transform_mc": 0.184, + "eval_task_acc_object_conditioned_reorientation_mc": 0.228, + "eval_task_acc_observer_distance_choice": 0.596, + "eval_task_acc_relative_3d_position_mc": 0.524, + "eval_task_acc_relative_direction_mc": 0.336, + "eval_task_acc_seam_continuity_mc": 0.604, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.964, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.956, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.924, + "eval_task_bfov_iou_referring_grounding_bfov": 0.6771139578068157, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 1800 + }, + { + "epoch": 0.051731055829416485, + "grad_norm": 42.65435094837691, + "learning_rate": 9.987661459905923e-07, + "loss": 0.6145731449127197, + "step": 1805 + }, + { + "epoch": 0.05187435515304368, + "grad_norm": 44.789916492010924, + "learning_rate": 9.987497997200282e-07, + "loss": 0.5795726776123047, + "step": 1810 + }, + { + "epoch": 0.05201765447667087, + "grad_norm": 24.695797989688508, + "learning_rate": 9.987333460175178e-07, + "loss": 0.5557641983032227, + "step": 1815 + }, + { + "epoch": 0.05216095380029806, + "grad_norm": 33.91647144029123, + "learning_rate": 9.987167848866054e-07, + "loss": 0.5380540370941163, + "step": 1820 + }, + { + "epoch": 0.052304253123925254, + "grad_norm": 23.97420629531828, + "learning_rate": 9.987001163308581e-07, + "loss": 0.6042009830474854, + "step": 1825 + }, + { + "epoch": 0.05244755244755245, + "grad_norm": 63.64092426767485, + "learning_rate": 9.986833403538666e-07, + "loss": 0.553748607635498, + "step": 1830 + }, + { + "epoch": 0.05259085177117964, + "grad_norm": 21.53379732332509, + "learning_rate": 9.986664569592442e-07, + "loss": 0.5428660392761231, + "step": 1835 + }, + { + "epoch": 0.052734151094806836, + "grad_norm": 39.35874968914829, + "learning_rate": 9.986494661506278e-07, + "loss": 0.5679403305053711, + "step": 1840 + }, + { + "epoch": 0.05287745041843402, + "grad_norm": 25.835328606057182, + "learning_rate": 9.98632367931677e-07, + "loss": 0.576496171951294, + "step": 1845 + }, + { + "epoch": 0.05302074974206122, + "grad_norm": 29.67603256879353, + "learning_rate": 9.986151623060751e-07, + "loss": 0.5492051124572754, + "step": 1850 + }, + { + "epoch": 0.05316404906568841, + "grad_norm": 31.71996725148325, + "learning_rate": 9.985978492775284e-07, + "loss": 0.5772919178009033, + "step": 1855 + }, + { + "epoch": 0.053307348389315605, + "grad_norm": 72.23935976424474, + "learning_rate": 9.985804288497657e-07, + "loss": 0.5503857612609864, + "step": 1860 + }, + { + "epoch": 0.05345064771294279, + "grad_norm": 26.660060296777587, + "learning_rate": 9.985629010265397e-07, + "loss": 0.558431339263916, + "step": 1865 + }, + { + "epoch": 0.053593947036569986, + "grad_norm": 27.908496555918365, + "learning_rate": 9.985452658116257e-07, + "loss": 0.5900987148284912, + "step": 1870 + }, + { + "epoch": 0.05373724636019718, + "grad_norm": 24.144660639572987, + "learning_rate": 9.985275232088227e-07, + "loss": 0.574009895324707, + "step": 1875 + }, + { + "epoch": 0.053880545683824374, + "grad_norm": 22.841400605841166, + "learning_rate": 9.985096732219522e-07, + "loss": 0.579985237121582, + "step": 1880 + }, + { + "epoch": 0.05402384500745157, + "grad_norm": 29.337941802137994, + "learning_rate": 9.984917158548593e-07, + "loss": 0.5782270431518555, + "step": 1885 + }, + { + "epoch": 0.054167144331078755, + "grad_norm": 19.92157207633127, + "learning_rate": 9.98473651111412e-07, + "loss": 0.5493410110473633, + "step": 1890 + }, + { + "epoch": 0.05431044365470595, + "grad_norm": 47.02921163120301, + "learning_rate": 9.984554789955014e-07, + "loss": 0.5648251533508301, + "step": 1895 + }, + { + "epoch": 0.05445374297833314, + "grad_norm": 22.15831935026846, + "learning_rate": 9.98437199511042e-07, + "loss": 0.5179810523986816, + "step": 1900 + }, + { + "epoch": 0.05459704230196034, + "grad_norm": 30.6533304425409, + "learning_rate": 9.984188126619714e-07, + "loss": 0.5594252109527588, + "step": 1905 + }, + { + "epoch": 0.054740341625587524, + "grad_norm": 63.89724911215796, + "learning_rate": 9.984003184522497e-07, + "loss": 0.5831832885742188, + "step": 1910 + }, + { + "epoch": 0.05488364094921472, + "grad_norm": 51.06749597072202, + "learning_rate": 9.98381716885861e-07, + "loss": 0.5748478889465332, + "step": 1915 + }, + { + "epoch": 0.05502694027284191, + "grad_norm": 29.068062964743937, + "learning_rate": 9.983630079668117e-07, + "loss": 0.5136538505554199, + "step": 1920 + }, + { + "epoch": 0.055170239596469106, + "grad_norm": 30.759049082821463, + "learning_rate": 9.983441916991322e-07, + "loss": 0.5646014213562012, + "step": 1925 + }, + { + "epoch": 0.0553135389200963, + "grad_norm": 25.933494027389095, + "learning_rate": 9.983252680868755e-07, + "loss": 0.5611042499542236, + "step": 1930 + }, + { + "epoch": 0.05545683824372349, + "grad_norm": 35.965247173200154, + "learning_rate": 9.983062371341176e-07, + "loss": 0.5771488189697266, + "step": 1935 + }, + { + "epoch": 0.05560013756735068, + "grad_norm": 28.081904836521595, + "learning_rate": 9.982870988449578e-07, + "loss": 0.5232611656188965, + "step": 1940 + }, + { + "epoch": 0.055743436890977875, + "grad_norm": 31.398913152730156, + "learning_rate": 9.982678532235187e-07, + "loss": 0.5805857658386231, + "step": 1945 + }, + { + "epoch": 0.05588673621460507, + "grad_norm": 26.674746883155656, + "learning_rate": 9.982485002739455e-07, + "loss": 0.5941373348236084, + "step": 1950 + }, + { + "epoch": 0.056030035538232256, + "grad_norm": 53.800675408079556, + "learning_rate": 9.982290400004076e-07, + "loss": 0.5326552867889405, + "step": 1955 + }, + { + "epoch": 0.05617333486185945, + "grad_norm": 21.36094040921514, + "learning_rate": 9.98209472407096e-07, + "loss": 0.5469865798950195, + "step": 1960 + }, + { + "epoch": 0.056316634185486644, + "grad_norm": 75.06674045571799, + "learning_rate": 9.981897974982262e-07, + "loss": 0.5263578414916992, + "step": 1965 + }, + { + "epoch": 0.05645993350911384, + "grad_norm": 32.12703697650007, + "learning_rate": 9.981700152780358e-07, + "loss": 0.5335044860839844, + "step": 1970 + }, + { + "epoch": 0.05660323283274103, + "grad_norm": 34.3499842533584, + "learning_rate": 9.981501257507863e-07, + "loss": 0.579246711730957, + "step": 1975 + }, + { + "epoch": 0.05674653215636822, + "grad_norm": 26.417964511351204, + "learning_rate": 9.981301289207617e-07, + "loss": 0.5574973583221435, + "step": 1980 + }, + { + "epoch": 0.05688983147999541, + "grad_norm": 18.171096516732877, + "learning_rate": 9.981100247922693e-07, + "loss": 0.532647705078125, + "step": 1985 + }, + { + "epoch": 0.05703313080362261, + "grad_norm": 29.25869874470219, + "learning_rate": 9.9808981336964e-07, + "loss": 0.5788944244384766, + "step": 1990 + }, + { + "epoch": 0.0571764301272498, + "grad_norm": 19.180780939224768, + "learning_rate": 9.98069494657227e-07, + "loss": 0.5830686569213868, + "step": 1995 + }, + { + "epoch": 0.057319729450876995, + "grad_norm": 18.633635853700614, + "learning_rate": 9.98049068659407e-07, + "loss": 0.5695031166076661, + "step": 2000 + }, + { + "epoch": 0.05746302877450418, + "grad_norm": 21.127046953266213, + "learning_rate": 9.9802853538058e-07, + "loss": 0.5626104354858399, + "step": 2005 + }, + { + "epoch": 0.057606328098131376, + "grad_norm": 42.11147974687228, + "learning_rate": 9.980078948251688e-07, + "loss": 0.574973201751709, + "step": 2010 + }, + { + "epoch": 0.05774962742175857, + "grad_norm": 35.57372861150963, + "learning_rate": 9.979871469976195e-07, + "loss": 0.5204398155212402, + "step": 2015 + }, + { + "epoch": 0.057892926745385764, + "grad_norm": 20.953804523174803, + "learning_rate": 9.979662919024012e-07, + "loss": 0.6023273468017578, + "step": 2020 + }, + { + "epoch": 0.05803622606901295, + "grad_norm": 30.753955029719254, + "learning_rate": 9.97945329544006e-07, + "loss": 0.5394299507141114, + "step": 2025 + }, + { + "epoch": 0.058179525392640145, + "grad_norm": 30.5465133623747, + "learning_rate": 9.979242599269497e-07, + "loss": 0.49974522590637205, + "step": 2030 + }, + { + "epoch": 0.05832282471626734, + "grad_norm": 46.366158018416314, + "learning_rate": 9.979030830557702e-07, + "loss": 0.579921817779541, + "step": 2035 + }, + { + "epoch": 0.05846612403989453, + "grad_norm": 37.912815727086716, + "learning_rate": 9.978817989350293e-07, + "loss": 0.5445592880249024, + "step": 2040 + }, + { + "epoch": 0.05860942336352173, + "grad_norm": 35.945710550946515, + "learning_rate": 9.978604075693117e-07, + "loss": 0.5547400951385498, + "step": 2045 + }, + { + "epoch": 0.058752722687148914, + "grad_norm": 22.596497540279845, + "learning_rate": 9.97838908963225e-07, + "loss": 0.5724043369293212, + "step": 2050 + }, + { + "epoch": 0.05889602201077611, + "grad_norm": 24.59772433223708, + "learning_rate": 9.978173031214001e-07, + "loss": 0.5646142959594727, + "step": 2055 + }, + { + "epoch": 0.0590393213344033, + "grad_norm": 18.500554819817953, + "learning_rate": 9.977955900484913e-07, + "loss": 0.5387094974517822, + "step": 2060 + }, + { + "epoch": 0.059182620658030496, + "grad_norm": 48.49378746842396, + "learning_rate": 9.97773769749175e-07, + "loss": 0.568783187866211, + "step": 2065 + }, + { + "epoch": 0.059325919981657683, + "grad_norm": 23.492431131201492, + "learning_rate": 9.97751842228152e-07, + "loss": 0.5180603504180908, + "step": 2070 + }, + { + "epoch": 0.05946921930528488, + "grad_norm": 35.758025842118535, + "learning_rate": 9.97729807490145e-07, + "loss": 0.5319781303405762, + "step": 2075 + }, + { + "epoch": 0.05961251862891207, + "grad_norm": 39.3449371076271, + "learning_rate": 9.977076655399007e-07, + "loss": 0.5683656692504883, + "step": 2080 + }, + { + "epoch": 0.059755817952539265, + "grad_norm": 21.78435094576682, + "learning_rate": 9.976854163821883e-07, + "loss": 0.5841338157653808, + "step": 2085 + }, + { + "epoch": 0.05989911727616646, + "grad_norm": 20.782284773044317, + "learning_rate": 9.976630600218005e-07, + "loss": 0.5238406181335449, + "step": 2090 + }, + { + "epoch": 0.06004241659979365, + "grad_norm": 47.65065504517986, + "learning_rate": 9.976405964635528e-07, + "loss": 0.5750688552856446, + "step": 2095 + }, + { + "epoch": 0.06018571592342084, + "grad_norm": 27.993491714596065, + "learning_rate": 9.97618025712284e-07, + "loss": 0.5586501598358155, + "step": 2100 + }, + { + "epoch": 0.06018571592342084, + "eval_bfov_iou": 0.7063012992368056, + "eval_bfov_iou@0.1": 0.976, + "eval_bfov_iou@0.25": 0.976, + "eval_bfov_iou@0.5": 0.944, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.4645714285714286, + "eval_exact_match": 0.3585, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 339.7009, + "eval_samples_per_second": 5.888, + "eval_steps_per_second": 0.185, + "eval_task_acc_absolute_direction_mc": 0.748, + "eval_task_acc_camera_rotation_transform_mc": 0.236, + "eval_task_acc_object_conditioned_reorientation_mc": 0.272, + "eval_task_acc_observer_distance_choice": 0.564, + "eval_task_acc_relative_3d_position_mc": 0.5, + "eval_task_acc_relative_direction_mc": 0.344, + "eval_task_acc_seam_continuity_mc": 0.588, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.944, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7063012992368056, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 2100 + }, + { + "epoch": 0.060329015247048035, + "grad_norm": 37.637867441444605, + "learning_rate": 9.975953477728557e-07, + "loss": 0.5351792812347412, + "step": 2105 + }, + { + "epoch": 0.06047231457067523, + "grad_norm": 22.83526254643094, + "learning_rate": 9.97572562650153e-07, + "loss": 0.516766357421875, + "step": 2110 + }, + { + "epoch": 0.060615613894302416, + "grad_norm": 97.37872702859023, + "learning_rate": 9.975496703490838e-07, + "loss": 0.5490057945251465, + "step": 2115 + }, + { + "epoch": 0.06075891321792961, + "grad_norm": 23.87977198145564, + "learning_rate": 9.975266708745793e-07, + "loss": 0.5263628005981446, + "step": 2120 + }, + { + "epoch": 0.060902212541556804, + "grad_norm": 37.16902050671432, + "learning_rate": 9.975035642315934e-07, + "loss": 0.5739933490753174, + "step": 2125 + }, + { + "epoch": 0.061045511865184, + "grad_norm": 37.88046404453032, + "learning_rate": 9.974803504251035e-07, + "loss": 0.5276651382446289, + "step": 2130 + }, + { + "epoch": 0.06118881118881119, + "grad_norm": 33.23428442203892, + "learning_rate": 9.974570294601096e-07, + "loss": 0.5317352771759033, + "step": 2135 + }, + { + "epoch": 0.06133211051243838, + "grad_norm": 30.6867130394758, + "learning_rate": 9.974336013416355e-07, + "loss": 0.5519020080566406, + "step": 2140 + }, + { + "epoch": 0.06147540983606557, + "grad_norm": 18.779566752606954, + "learning_rate": 9.974100660747276e-07, + "loss": 0.5632105827331543, + "step": 2145 + }, + { + "epoch": 0.06161870915969277, + "grad_norm": 21.722761486393825, + "learning_rate": 9.973864236644552e-07, + "loss": 0.5451555728912354, + "step": 2150 + }, + { + "epoch": 0.06176200848331996, + "grad_norm": 35.18057471964608, + "learning_rate": 9.97362674115911e-07, + "loss": 0.5790920257568359, + "step": 2155 + }, + { + "epoch": 0.061905307806947155, + "grad_norm": 22.878667630599466, + "learning_rate": 9.973388174342112e-07, + "loss": 0.5550158977508545, + "step": 2160 + }, + { + "epoch": 0.06204860713057434, + "grad_norm": 28.273538382309095, + "learning_rate": 9.97314853624494e-07, + "loss": 0.5470467567443847, + "step": 2165 + }, + { + "epoch": 0.062191906454201536, + "grad_norm": 58.89746344231349, + "learning_rate": 9.972907826919215e-07, + "loss": 0.6016593933105469, + "step": 2170 + }, + { + "epoch": 0.06233520577782873, + "grad_norm": 37.403888908961704, + "learning_rate": 9.972666046416784e-07, + "loss": 0.5454718589782714, + "step": 2175 + }, + { + "epoch": 0.062478505101455924, + "grad_norm": 58.49077103859525, + "learning_rate": 9.972423194789733e-07, + "loss": 0.590122127532959, + "step": 2180 + }, + { + "epoch": 0.06262180442508311, + "grad_norm": 29.368976709011726, + "learning_rate": 9.972179272090366e-07, + "loss": 0.5803613662719727, + "step": 2185 + }, + { + "epoch": 0.0627651037487103, + "grad_norm": 26.56949299933504, + "learning_rate": 9.971934278371228e-07, + "loss": 0.5887083530426025, + "step": 2190 + }, + { + "epoch": 0.0629084030723375, + "grad_norm": 23.73877268587442, + "learning_rate": 9.971688213685091e-07, + "loss": 0.5512824058532715, + "step": 2195 + }, + { + "epoch": 0.06305170239596469, + "grad_norm": 43.149980429705344, + "learning_rate": 9.971441078084959e-07, + "loss": 0.5461443901062012, + "step": 2200 + }, + { + "epoch": 0.06319500171959189, + "grad_norm": 198.66060689801802, + "learning_rate": 9.971192871624062e-07, + "loss": 0.5567688465118408, + "step": 2205 + }, + { + "epoch": 0.06333830104321908, + "grad_norm": 39.14406193882319, + "learning_rate": 9.970943594355868e-07, + "loss": 0.5450233459472656, + "step": 2210 + }, + { + "epoch": 0.06348160036684627, + "grad_norm": 26.86966621524003, + "learning_rate": 9.97069324633407e-07, + "loss": 0.5251582145690918, + "step": 2215 + }, + { + "epoch": 0.06362489969047345, + "grad_norm": 28.827531237015425, + "learning_rate": 9.970441827612595e-07, + "loss": 0.5495836734771729, + "step": 2220 + }, + { + "epoch": 0.06376819901410065, + "grad_norm": 23.106212303197097, + "learning_rate": 9.970189338245598e-07, + "loss": 0.5537035465240479, + "step": 2225 + }, + { + "epoch": 0.06391149833772784, + "grad_norm": 34.42365810264678, + "learning_rate": 9.969935778287466e-07, + "loss": 0.5509922981262207, + "step": 2230 + }, + { + "epoch": 0.06405479766135504, + "grad_norm": 48.15440517302124, + "learning_rate": 9.969681147792819e-07, + "loss": 0.5398993968963623, + "step": 2235 + }, + { + "epoch": 0.06419809698498223, + "grad_norm": 29.630823295761, + "learning_rate": 9.969425446816499e-07, + "loss": 0.5586915493011475, + "step": 2240 + }, + { + "epoch": 0.06434139630860942, + "grad_norm": 48.945806985547165, + "learning_rate": 9.969168675413591e-07, + "loss": 0.5244209289550781, + "step": 2245 + }, + { + "epoch": 0.06448469563223662, + "grad_norm": 35.28991301142812, + "learning_rate": 9.9689108336394e-07, + "loss": 0.5450331687927246, + "step": 2250 + }, + { + "epoch": 0.06462799495586381, + "grad_norm": 26.17817858631182, + "learning_rate": 9.96865192154947e-07, + "loss": 0.5360057830810547, + "step": 2255 + }, + { + "epoch": 0.064771294279491, + "grad_norm": 27.75483173502652, + "learning_rate": 9.968391939199565e-07, + "loss": 0.5114997863769531, + "step": 2260 + }, + { + "epoch": 0.06491459360311819, + "grad_norm": 42.47633146334045, + "learning_rate": 9.96813088664569e-07, + "loss": 0.5636953353881836, + "step": 2265 + }, + { + "epoch": 0.06505789292674538, + "grad_norm": 27.871205739433933, + "learning_rate": 9.96786876394408e-07, + "loss": 0.5596622467041016, + "step": 2270 + }, + { + "epoch": 0.06520119225037257, + "grad_norm": 25.03025318782488, + "learning_rate": 9.967605571151187e-07, + "loss": 0.5532896995544434, + "step": 2275 + }, + { + "epoch": 0.06534449157399977, + "grad_norm": 24.62921099593212, + "learning_rate": 9.967341308323713e-07, + "loss": 0.554608678817749, + "step": 2280 + }, + { + "epoch": 0.06548779089762696, + "grad_norm": 22.640054520422115, + "learning_rate": 9.967075975518575e-07, + "loss": 0.5418046951293946, + "step": 2285 + }, + { + "epoch": 0.06563109022125416, + "grad_norm": 18.82471036332898, + "learning_rate": 9.96680957279293e-07, + "loss": 0.5302847862243653, + "step": 2290 + }, + { + "epoch": 0.06577438954488135, + "grad_norm": 17.62441922679826, + "learning_rate": 9.966542100204159e-07, + "loss": 0.5292478561401367, + "step": 2295 + }, + { + "epoch": 0.06591768886850854, + "grad_norm": 30.90482487627282, + "learning_rate": 9.966273557809878e-07, + "loss": 0.5472880363464355, + "step": 2300 + }, + { + "epoch": 0.06606098819213574, + "grad_norm": 23.590316409300648, + "learning_rate": 9.966003945667932e-07, + "loss": 0.49915270805358886, + "step": 2305 + }, + { + "epoch": 0.06620428751576292, + "grad_norm": 34.74880348581048, + "learning_rate": 9.965733263836394e-07, + "loss": 0.5279040336608887, + "step": 2310 + }, + { + "epoch": 0.06634758683939011, + "grad_norm": 18.138262713791224, + "learning_rate": 9.96546151237357e-07, + "loss": 0.574882173538208, + "step": 2315 + }, + { + "epoch": 0.06649088616301731, + "grad_norm": 81.2710102090581, + "learning_rate": 9.965188691337997e-07, + "loss": 0.5851914882659912, + "step": 2320 + }, + { + "epoch": 0.0666341854866445, + "grad_norm": 50.351006718036196, + "learning_rate": 9.96491480078844e-07, + "loss": 0.5672521591186523, + "step": 2325 + }, + { + "epoch": 0.0667774848102717, + "grad_norm": 24.111022896105045, + "learning_rate": 9.964639840783898e-07, + "loss": 0.522936487197876, + "step": 2330 + }, + { + "epoch": 0.06692078413389889, + "grad_norm": 23.896338181793777, + "learning_rate": 9.9643638113836e-07, + "loss": 0.5476967334747315, + "step": 2335 + }, + { + "epoch": 0.06706408345752608, + "grad_norm": 24.148825711611842, + "learning_rate": 9.964086712646996e-07, + "loss": 0.5374104499816894, + "step": 2340 + }, + { + "epoch": 0.06720738278115328, + "grad_norm": 21.831265973890368, + "learning_rate": 9.963808544633777e-07, + "loss": 0.5281474590301514, + "step": 2345 + }, + { + "epoch": 0.06735068210478047, + "grad_norm": 32.74415546331606, + "learning_rate": 9.963529307403867e-07, + "loss": 0.5331390380859375, + "step": 2350 + }, + { + "epoch": 0.06749398142840765, + "grad_norm": 19.816898244469485, + "learning_rate": 9.963249001017405e-07, + "loss": 0.5320673942565918, + "step": 2355 + }, + { + "epoch": 0.06763728075203485, + "grad_norm": 19.877879563927692, + "learning_rate": 9.962967625534776e-07, + "loss": 0.5392120838165283, + "step": 2360 + }, + { + "epoch": 0.06778058007566204, + "grad_norm": 21.019108427169776, + "learning_rate": 9.962685181016586e-07, + "loss": 0.5417577743530273, + "step": 2365 + }, + { + "epoch": 0.06792387939928923, + "grad_norm": 29.535944080079616, + "learning_rate": 9.962401667523676e-07, + "loss": 0.5622740745544433, + "step": 2370 + }, + { + "epoch": 0.06806717872291643, + "grad_norm": 22.02064100167497, + "learning_rate": 9.962117085117117e-07, + "loss": 0.5347784042358399, + "step": 2375 + }, + { + "epoch": 0.06821047804654362, + "grad_norm": 20.39605504494229, + "learning_rate": 9.961831433858204e-07, + "loss": 0.4924062728881836, + "step": 2380 + }, + { + "epoch": 0.06835377737017082, + "grad_norm": 22.51561735126017, + "learning_rate": 9.96154471380847e-07, + "loss": 0.5699559211730957, + "step": 2385 + }, + { + "epoch": 0.06849707669379801, + "grad_norm": 20.786245126698912, + "learning_rate": 9.961256925029674e-07, + "loss": 0.522845458984375, + "step": 2390 + }, + { + "epoch": 0.0686403760174252, + "grad_norm": 23.32842670440012, + "learning_rate": 9.96096806758381e-07, + "loss": 0.5319356441497802, + "step": 2395 + }, + { + "epoch": 0.0687836753410524, + "grad_norm": 59.138017087446336, + "learning_rate": 9.960678141533094e-07, + "loss": 0.5262545585632324, + "step": 2400 + }, + { + "epoch": 0.0687836753410524, + "eval_bfov_iou": 0.7360317842821956, + "eval_bfov_iou@0.1": 0.98, + "eval_bfov_iou@0.25": 0.98, + "eval_bfov_iou@0.5": 0.968, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.49942857142857144, + "eval_exact_match": 0.3915, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 339.0048, + "eval_samples_per_second": 5.9, + "eval_steps_per_second": 0.186, + "eval_task_acc_absolute_direction_mc": 0.848, + "eval_task_acc_camera_rotation_transform_mc": 0.268, + "eval_task_acc_object_conditioned_reorientation_mc": 0.288, + "eval_task_acc_observer_distance_choice": 0.592, + "eval_task_acc_relative_3d_position_mc": 0.504, + "eval_task_acc_relative_direction_mc": 0.348, + "eval_task_acc_seam_continuity_mc": 0.648, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.98, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.98, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.968, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7360317842821956, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 2400 + }, + { + "epoch": 0.06892697466467958, + "grad_norm": 28.46340730112114, + "learning_rate": 9.96038714693998e-07, + "loss": 0.5385133743286132, + "step": 2405 + }, + { + "epoch": 0.06907027398830677, + "grad_norm": 34.960810920741594, + "learning_rate": 9.960095083867146e-07, + "loss": 0.5468213558197021, + "step": 2410 + }, + { + "epoch": 0.06921357331193397, + "grad_norm": 19.669926413606795, + "learning_rate": 9.959801952377504e-07, + "loss": 0.5099459171295166, + "step": 2415 + }, + { + "epoch": 0.06935687263556116, + "grad_norm": 23.808982211997584, + "learning_rate": 9.9595077525342e-07, + "loss": 0.4881103992462158, + "step": 2420 + }, + { + "epoch": 0.06950017195918835, + "grad_norm": 19.905918751563128, + "learning_rate": 9.959212484400597e-07, + "loss": 0.5512032032012939, + "step": 2425 + }, + { + "epoch": 0.06964347128281555, + "grad_norm": 26.167025081062057, + "learning_rate": 9.958916148040303e-07, + "loss": 0.5400328636169434, + "step": 2430 + }, + { + "epoch": 0.06978677060644274, + "grad_norm": 27.909571262725226, + "learning_rate": 9.958618743517146e-07, + "loss": 0.5294882297515869, + "step": 2435 + }, + { + "epoch": 0.06993006993006994, + "grad_norm": 46.5896078107343, + "learning_rate": 9.95832027089519e-07, + "loss": 0.5595605373382568, + "step": 2440 + }, + { + "epoch": 0.07007336925369713, + "grad_norm": 40.838002584612184, + "learning_rate": 9.958020730238726e-07, + "loss": 0.5901246070861816, + "step": 2445 + }, + { + "epoch": 0.07021666857732431, + "grad_norm": 21.14760519796573, + "learning_rate": 9.957720121612276e-07, + "loss": 0.5281941413879394, + "step": 2450 + }, + { + "epoch": 0.0703599679009515, + "grad_norm": 17.34163056630467, + "learning_rate": 9.957418445080593e-07, + "loss": 0.5230538368225097, + "step": 2455 + }, + { + "epoch": 0.0705032672245787, + "grad_norm": 25.662965251536143, + "learning_rate": 9.957115700708654e-07, + "loss": 0.5073868751525878, + "step": 2460 + }, + { + "epoch": 0.07064656654820589, + "grad_norm": 14.79963499520184, + "learning_rate": 9.956811888561676e-07, + "loss": 0.559490966796875, + "step": 2465 + }, + { + "epoch": 0.07078986587183309, + "grad_norm": 27.134124016716864, + "learning_rate": 9.956507008705099e-07, + "loss": 0.5268296241760254, + "step": 2470 + }, + { + "epoch": 0.07093316519546028, + "grad_norm": 16.201198126707357, + "learning_rate": 9.956201061204594e-07, + "loss": 0.5377682209014892, + "step": 2475 + }, + { + "epoch": 0.07107646451908747, + "grad_norm": 21.760682037902136, + "learning_rate": 9.955894046126066e-07, + "loss": 0.5289341926574707, + "step": 2480 + }, + { + "epoch": 0.07121976384271467, + "grad_norm": 16.575899996988653, + "learning_rate": 9.955585963535642e-07, + "loss": 0.5238601684570312, + "step": 2485 + }, + { + "epoch": 0.07136306316634186, + "grad_norm": 22.72543594239377, + "learning_rate": 9.95527681349969e-07, + "loss": 0.5727131843566895, + "step": 2490 + }, + { + "epoch": 0.07150636248996904, + "grad_norm": 18.37846026419657, + "learning_rate": 9.954966596084796e-07, + "loss": 0.5598538398742676, + "step": 2495 + }, + { + "epoch": 0.07164966181359624, + "grad_norm": 21.540311095522114, + "learning_rate": 9.954655311357782e-07, + "loss": 0.5875561714172364, + "step": 2500 + }, + { + "epoch": 0.07179296113722343, + "grad_norm": 18.622210433492086, + "learning_rate": 9.954342959385703e-07, + "loss": 0.5497575759887695, + "step": 2505 + }, + { + "epoch": 0.07193626046085062, + "grad_norm": 24.96077463429196, + "learning_rate": 9.954029540235839e-07, + "loss": 0.5521080970764161, + "step": 2510 + }, + { + "epoch": 0.07207955978447782, + "grad_norm": 24.7469741311417, + "learning_rate": 9.9537150539757e-07, + "loss": 0.5452692031860351, + "step": 2515 + }, + { + "epoch": 0.07222285910810501, + "grad_norm": 31.36210389016282, + "learning_rate": 9.95339950067303e-07, + "loss": 0.5227056980133057, + "step": 2520 + }, + { + "epoch": 0.0723661584317322, + "grad_norm": 26.92849407163919, + "learning_rate": 9.953082880395795e-07, + "loss": 0.5300332546234131, + "step": 2525 + }, + { + "epoch": 0.0725094577553594, + "grad_norm": 68.38974443546326, + "learning_rate": 9.952765193212202e-07, + "loss": 0.5640726089477539, + "step": 2530 + }, + { + "epoch": 0.0726527570789866, + "grad_norm": 23.379567458282466, + "learning_rate": 9.952446439190677e-07, + "loss": 0.5263796806335449, + "step": 2535 + }, + { + "epoch": 0.07279605640261377, + "grad_norm": 44.24496116116468, + "learning_rate": 9.95212661839988e-07, + "loss": 0.5237110614776611, + "step": 2540 + }, + { + "epoch": 0.07293935572624097, + "grad_norm": 21.801021867337507, + "learning_rate": 9.951805730908705e-07, + "loss": 0.580851936340332, + "step": 2545 + }, + { + "epoch": 0.07308265504986816, + "grad_norm": 58.91098156809349, + "learning_rate": 9.95148377678627e-07, + "loss": 0.5647574424743652, + "step": 2550 + }, + { + "epoch": 0.07322595437349536, + "grad_norm": 25.663774962069954, + "learning_rate": 9.951160756101924e-07, + "loss": 0.5560009002685546, + "step": 2555 + }, + { + "epoch": 0.07336925369712255, + "grad_norm": 21.281131266102445, + "learning_rate": 9.950836668925248e-07, + "loss": 0.5424549102783203, + "step": 2560 + }, + { + "epoch": 0.07351255302074974, + "grad_norm": 21.557432880370484, + "learning_rate": 9.95051151532605e-07, + "loss": 0.5357072830200196, + "step": 2565 + }, + { + "epoch": 0.07365585234437694, + "grad_norm": 27.974075773727954, + "learning_rate": 9.950185295374369e-07, + "loss": 0.547773790359497, + "step": 2570 + }, + { + "epoch": 0.07379915166800413, + "grad_norm": 24.19100315247805, + "learning_rate": 9.949858009140472e-07, + "loss": 0.5303547382354736, + "step": 2575 + }, + { + "epoch": 0.07394245099163133, + "grad_norm": 19.118725910422395, + "learning_rate": 9.949529656694861e-07, + "loss": 0.5418184757232666, + "step": 2580 + }, + { + "epoch": 0.0740857503152585, + "grad_norm": 24.895188154080966, + "learning_rate": 9.949200238108262e-07, + "loss": 0.5562070846557617, + "step": 2585 + }, + { + "epoch": 0.0742290496388857, + "grad_norm": 35.38434343359723, + "learning_rate": 9.948869753451632e-07, + "loss": 0.5491747379302978, + "step": 2590 + }, + { + "epoch": 0.0743723489625129, + "grad_norm": 28.05694734654616, + "learning_rate": 9.94853820279616e-07, + "loss": 0.5220667839050293, + "step": 2595 + }, + { + "epoch": 0.07451564828614009, + "grad_norm": 16.54283144733536, + "learning_rate": 9.94820558621326e-07, + "loss": 0.49973058700561523, + "step": 2600 + }, + { + "epoch": 0.07465894760976728, + "grad_norm": 27.84740719732308, + "learning_rate": 9.94787190377458e-07, + "loss": 0.5218687057495117, + "step": 2605 + }, + { + "epoch": 0.07480224693339448, + "grad_norm": 31.3334258724523, + "learning_rate": 9.947537155551997e-07, + "loss": 0.5317508697509765, + "step": 2610 + }, + { + "epoch": 0.07494554625702167, + "grad_norm": 19.928344027071326, + "learning_rate": 9.947201341617617e-07, + "loss": 0.4992988586425781, + "step": 2615 + }, + { + "epoch": 0.07508884558064886, + "grad_norm": 18.61327833268571, + "learning_rate": 9.946864462043771e-07, + "loss": 0.5186854362487793, + "step": 2620 + }, + { + "epoch": 0.07523214490427606, + "grad_norm": 34.70116313860689, + "learning_rate": 9.94652651690303e-07, + "loss": 0.5293817520141602, + "step": 2625 + }, + { + "epoch": 0.07537544422790324, + "grad_norm": 21.809264068631492, + "learning_rate": 9.946187506268182e-07, + "loss": 0.5128029346466064, + "step": 2630 + }, + { + "epoch": 0.07551874355153043, + "grad_norm": 25.055664293810246, + "learning_rate": 9.945847430212254e-07, + "loss": 0.5432379722595215, + "step": 2635 + }, + { + "epoch": 0.07566204287515763, + "grad_norm": 16.31994701829861, + "learning_rate": 9.9455062888085e-07, + "loss": 0.5415416717529297, + "step": 2640 + }, + { + "epoch": 0.07580534219878482, + "grad_norm": 25.27613041657911, + "learning_rate": 9.9451640821304e-07, + "loss": 0.5287370681762695, + "step": 2645 + }, + { + "epoch": 0.07594864152241201, + "grad_norm": 22.42047581694453, + "learning_rate": 9.94482081025167e-07, + "loss": 0.5460508823394775, + "step": 2650 + }, + { + "epoch": 0.07609194084603921, + "grad_norm": 26.095020931850982, + "learning_rate": 9.944476473246244e-07, + "loss": 0.5724791526794434, + "step": 2655 + }, + { + "epoch": 0.0762352401696664, + "grad_norm": 23.655590672935425, + "learning_rate": 9.944131071188302e-07, + "loss": 0.5637454986572266, + "step": 2660 + }, + { + "epoch": 0.0763785394932936, + "grad_norm": 23.22266914891859, + "learning_rate": 9.943784604152242e-07, + "loss": 0.5410524845123291, + "step": 2665 + }, + { + "epoch": 0.07652183881692079, + "grad_norm": 16.878734407034507, + "learning_rate": 9.94343707221269e-07, + "loss": 0.5322293281555176, + "step": 2670 + }, + { + "epoch": 0.07666513814054797, + "grad_norm": 118.1927660877049, + "learning_rate": 9.943088475444507e-07, + "loss": 0.5422255992889404, + "step": 2675 + }, + { + "epoch": 0.07680843746417516, + "grad_norm": 57.49469719246989, + "learning_rate": 9.942738813922787e-07, + "loss": 0.5521134853363037, + "step": 2680 + }, + { + "epoch": 0.07695173678780236, + "grad_norm": 23.66397559470668, + "learning_rate": 9.942388087722839e-07, + "loss": 0.5223199367523194, + "step": 2685 + }, + { + "epoch": 0.07709503611142955, + "grad_norm": 29.570862484454928, + "learning_rate": 9.942036296920216e-07, + "loss": 0.5610921382904053, + "step": 2690 + }, + { + "epoch": 0.07723833543505675, + "grad_norm": 23.891415738595562, + "learning_rate": 9.941683441590693e-07, + "loss": 0.5709507942199707, + "step": 2695 + }, + { + "epoch": 0.07738163475868394, + "grad_norm": 19.42587168319658, + "learning_rate": 9.941329521810277e-07, + "loss": 0.5594826698303222, + "step": 2700 + }, + { + "epoch": 0.07738163475868394, + "eval_bfov_iou": 0.7721981076910327, + "eval_bfov_iou@0.1": 0.98, + "eval_bfov_iou@0.25": 0.972, + "eval_bfov_iou@0.5": 0.964, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5171428571428571, + "eval_exact_match": 0.4335, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 336.2734, + "eval_samples_per_second": 5.948, + "eval_steps_per_second": 0.187, + "eval_task_acc_absolute_direction_mc": 0.852, + "eval_task_acc_camera_rotation_transform_mc": 0.288, + "eval_task_acc_object_conditioned_reorientation_mc": 0.304, + "eval_task_acc_observer_distance_choice": 0.548, + "eval_task_acc_relative_3d_position_mc": 0.54, + "eval_task_acc_relative_direction_mc": 0.388, + "eval_task_acc_seam_continuity_mc": 0.7, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.98, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.972, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.964, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7721981076910327, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 2700 + }, + { + "epoch": 0.07752493408231113, + "grad_norm": 16.76242564031885, + "learning_rate": 9.940974537655203e-07, + "loss": 0.5312869548797607, + "step": 2705 + }, + { + "epoch": 0.07766823340593833, + "grad_norm": 25.264774250253815, + "learning_rate": 9.940618489201933e-07, + "loss": 0.5273028373718261, + "step": 2710 + }, + { + "epoch": 0.07781153272956552, + "grad_norm": 20.15943265078316, + "learning_rate": 9.940261376527166e-07, + "loss": 0.5225157737731934, + "step": 2715 + }, + { + "epoch": 0.07795483205319272, + "grad_norm": 23.83191134093326, + "learning_rate": 9.939903199707818e-07, + "loss": 0.5472304344177246, + "step": 2720 + }, + { + "epoch": 0.0780981313768199, + "grad_norm": 14.663631641329067, + "learning_rate": 9.939543958821045e-07, + "loss": 0.58319091796875, + "step": 2725 + }, + { + "epoch": 0.07824143070044709, + "grad_norm": 16.62032631478992, + "learning_rate": 9.939183653944232e-07, + "loss": 0.5544636249542236, + "step": 2730 + }, + { + "epoch": 0.07838473002407428, + "grad_norm": 18.011240085924307, + "learning_rate": 9.938822285154981e-07, + "loss": 0.5667471885681152, + "step": 2735 + }, + { + "epoch": 0.07852802934770148, + "grad_norm": 19.792123271142806, + "learning_rate": 9.93845985253114e-07, + "loss": 0.5081260681152344, + "step": 2740 + }, + { + "epoch": 0.07867132867132867, + "grad_norm": 22.1425339338076, + "learning_rate": 9.938096356150772e-07, + "loss": 0.5615932464599609, + "step": 2745 + }, + { + "epoch": 0.07881462799495587, + "grad_norm": 14.916121112631782, + "learning_rate": 9.937731796092178e-07, + "loss": 0.5489027976989747, + "step": 2750 + }, + { + "epoch": 0.07895792731858306, + "grad_norm": 15.843145698586431, + "learning_rate": 9.937366172433884e-07, + "loss": 0.5268912315368652, + "step": 2755 + }, + { + "epoch": 0.07910122664221025, + "grad_norm": 20.758942282988976, + "learning_rate": 9.936999485254647e-07, + "loss": 0.5376805782318115, + "step": 2760 + }, + { + "epoch": 0.07924452596583745, + "grad_norm": 16.73069976597231, + "learning_rate": 9.936631734633453e-07, + "loss": 0.5186863899230957, + "step": 2765 + }, + { + "epoch": 0.07938782528946463, + "grad_norm": 21.737662419629128, + "learning_rate": 9.936262920649513e-07, + "loss": 0.5180713176727295, + "step": 2770 + }, + { + "epoch": 0.07953112461309182, + "grad_norm": 48.89726899754624, + "learning_rate": 9.935893043382277e-07, + "loss": 0.5091361999511719, + "step": 2775 + }, + { + "epoch": 0.07967442393671902, + "grad_norm": 13.931594959437342, + "learning_rate": 9.93552210291141e-07, + "loss": 0.5550099849700928, + "step": 2780 + }, + { + "epoch": 0.07981772326034621, + "grad_norm": 16.74572194316923, + "learning_rate": 9.935150099316818e-07, + "loss": 0.5389566421508789, + "step": 2785 + }, + { + "epoch": 0.0799610225839734, + "grad_norm": 13.053105232783706, + "learning_rate": 9.934777032678632e-07, + "loss": 0.5275240421295166, + "step": 2790 + }, + { + "epoch": 0.0801043219076006, + "grad_norm": 19.74556967386735, + "learning_rate": 9.934402903077206e-07, + "loss": 0.5515280723571777, + "step": 2795 + }, + { + "epoch": 0.08024762123122779, + "grad_norm": 76.33375751952134, + "learning_rate": 9.934027710593136e-07, + "loss": 0.5769891262054443, + "step": 2800 + }, + { + "epoch": 0.08039092055485499, + "grad_norm": 26.963914609200874, + "learning_rate": 9.933651455307233e-07, + "loss": 0.5260500907897949, + "step": 2805 + }, + { + "epoch": 0.08053421987848218, + "grad_norm": 27.757102395234018, + "learning_rate": 9.933274137300548e-07, + "loss": 0.5139936923980712, + "step": 2810 + }, + { + "epoch": 0.08067751920210936, + "grad_norm": 29.63954749323088, + "learning_rate": 9.932895756654353e-07, + "loss": 0.578929853439331, + "step": 2815 + }, + { + "epoch": 0.08082081852573655, + "grad_norm": 32.24503997689612, + "learning_rate": 9.932516313450154e-07, + "loss": 0.5367796897888184, + "step": 2820 + }, + { + "epoch": 0.08096411784936375, + "grad_norm": 31.493422130161697, + "learning_rate": 9.932135807769683e-07, + "loss": 0.5031028747558594, + "step": 2825 + }, + { + "epoch": 0.08110741717299094, + "grad_norm": 26.445924307582548, + "learning_rate": 9.931754239694904e-07, + "loss": 0.5435145854949951, + "step": 2830 + }, + { + "epoch": 0.08125071649661814, + "grad_norm": 29.18377219140894, + "learning_rate": 9.931371609308005e-07, + "loss": 0.5260499000549317, + "step": 2835 + }, + { + "epoch": 0.08139401582024533, + "grad_norm": 23.576424566492438, + "learning_rate": 9.930987916691406e-07, + "loss": 0.5387123107910157, + "step": 2840 + }, + { + "epoch": 0.08153731514387252, + "grad_norm": 24.786626136401896, + "learning_rate": 9.930603161927755e-07, + "loss": 0.4832889556884766, + "step": 2845 + }, + { + "epoch": 0.08168061446749972, + "grad_norm": 28.15684308190436, + "learning_rate": 9.930217345099932e-07, + "loss": 0.5297474384307861, + "step": 2850 + }, + { + "epoch": 0.08182391379112691, + "grad_norm": 46.0742346231521, + "learning_rate": 9.92983046629104e-07, + "loss": 0.5509745597839355, + "step": 2855 + }, + { + "epoch": 0.08196721311475409, + "grad_norm": 22.4774123176724, + "learning_rate": 9.929442525584415e-07, + "loss": 0.5158735752105713, + "step": 2860 + }, + { + "epoch": 0.08211051243838129, + "grad_norm": 26.807380566126565, + "learning_rate": 9.92905352306362e-07, + "loss": 0.5375164031982422, + "step": 2865 + }, + { + "epoch": 0.08225381176200848, + "grad_norm": 33.75117182511355, + "learning_rate": 9.928663458812444e-07, + "loss": 0.5031775951385498, + "step": 2870 + }, + { + "epoch": 0.08239711108563567, + "grad_norm": 24.25135453596808, + "learning_rate": 9.928272332914916e-07, + "loss": 0.5269863128662109, + "step": 2875 + }, + { + "epoch": 0.08254041040926287, + "grad_norm": 15.07977454773422, + "learning_rate": 9.927880145455275e-07, + "loss": 0.5251748085021972, + "step": 2880 + }, + { + "epoch": 0.08268370973289006, + "grad_norm": 18.094219034259286, + "learning_rate": 9.92748689651801e-07, + "loss": 0.5407743453979492, + "step": 2885 + }, + { + "epoch": 0.08282700905651726, + "grad_norm": 15.463783214110725, + "learning_rate": 9.927092586187819e-07, + "loss": 0.5228888988494873, + "step": 2890 + }, + { + "epoch": 0.08297030838014445, + "grad_norm": 25.639359706344386, + "learning_rate": 9.926697214549643e-07, + "loss": 0.5132462501525878, + "step": 2895 + }, + { + "epoch": 0.08311360770377164, + "grad_norm": 22.732220405259024, + "learning_rate": 9.92630078168864e-07, + "loss": 0.5619603157043457, + "step": 2900 + }, + { + "epoch": 0.08325690702739882, + "grad_norm": 40.10465972059587, + "learning_rate": 9.925903287690209e-07, + "loss": 0.5325672149658203, + "step": 2905 + }, + { + "epoch": 0.08340020635102602, + "grad_norm": 19.83890496699772, + "learning_rate": 9.92550473263997e-07, + "loss": 0.5411595344543457, + "step": 2910 + }, + { + "epoch": 0.08354350567465321, + "grad_norm": 31.327298277680427, + "learning_rate": 9.925105116623767e-07, + "loss": 0.5136354923248291, + "step": 2915 + }, + { + "epoch": 0.0836868049982804, + "grad_norm": 16.443672747957653, + "learning_rate": 9.924704439727685e-07, + "loss": 0.5286950588226318, + "step": 2920 + }, + { + "epoch": 0.0838301043219076, + "grad_norm": 40.67689187557115, + "learning_rate": 9.92430270203803e-07, + "loss": 0.5190472602844238, + "step": 2925 + }, + { + "epoch": 0.0839734036455348, + "grad_norm": 35.43556403160313, + "learning_rate": 9.923899903641332e-07, + "loss": 0.5112854957580566, + "step": 2930 + }, + { + "epoch": 0.08411670296916199, + "grad_norm": 15.58123346464293, + "learning_rate": 9.923496044624361e-07, + "loss": 0.5089241981506347, + "step": 2935 + }, + { + "epoch": 0.08426000229278918, + "grad_norm": 32.78167017545767, + "learning_rate": 9.923091125074109e-07, + "loss": 0.5032940864562988, + "step": 2940 + }, + { + "epoch": 0.08440330161641638, + "grad_norm": 26.286917044106097, + "learning_rate": 9.922685145077792e-07, + "loss": 0.5369332313537598, + "step": 2945 + }, + { + "epoch": 0.08454660094004356, + "grad_norm": 25.882304485178505, + "learning_rate": 9.922278104722862e-07, + "loss": 0.5279065132141113, + "step": 2950 + }, + { + "epoch": 0.08468990026367075, + "grad_norm": 22.519743613388034, + "learning_rate": 9.921870004096993e-07, + "loss": 0.517902135848999, + "step": 2955 + }, + { + "epoch": 0.08483319958729794, + "grad_norm": 51.87414766891269, + "learning_rate": 9.921460843288096e-07, + "loss": 0.5578441143035888, + "step": 2960 + }, + { + "epoch": 0.08497649891092514, + "grad_norm": 29.939580014243926, + "learning_rate": 9.921050622384304e-07, + "loss": 0.4678792476654053, + "step": 2965 + }, + { + "epoch": 0.08511979823455233, + "grad_norm": 35.809992854234416, + "learning_rate": 9.92063934147398e-07, + "loss": 0.5241620540618896, + "step": 2970 + }, + { + "epoch": 0.08526309755817953, + "grad_norm": 42.02305554470282, + "learning_rate": 9.920227000645712e-07, + "loss": 0.597658348083496, + "step": 2975 + }, + { + "epoch": 0.08540639688180672, + "grad_norm": 19.92568453823032, + "learning_rate": 9.91981359998832e-07, + "loss": 0.5522371292114258, + "step": 2980 + }, + { + "epoch": 0.08554969620543391, + "grad_norm": 20.558036971774108, + "learning_rate": 9.919399139590855e-07, + "loss": 0.5625419616699219, + "step": 2985 + }, + { + "epoch": 0.08569299552906111, + "grad_norm": 28.810740213523143, + "learning_rate": 9.918983619542587e-07, + "loss": 0.5099779605865479, + "step": 2990 + }, + { + "epoch": 0.08583629485268829, + "grad_norm": 24.467812177866335, + "learning_rate": 9.918567039933026e-07, + "loss": 0.5113654136657715, + "step": 2995 + }, + { + "epoch": 0.08597959417631548, + "grad_norm": 29.780874678622272, + "learning_rate": 9.918149400851899e-07, + "loss": 0.5125518798828125, + "step": 3000 + }, + { + "epoch": 0.08597959417631548, + "eval_bfov_iou": 0.7283661378329055, + "eval_bfov_iou@0.1": 0.98, + "eval_bfov_iou@0.25": 0.972, + "eval_bfov_iou@0.5": 0.964, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5194285714285715, + "eval_exact_match": 0.3965, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 349.8638, + "eval_samples_per_second": 5.717, + "eval_steps_per_second": 0.18, + "eval_task_acc_absolute_direction_mc": 0.828, + "eval_task_acc_camera_rotation_transform_mc": 0.288, + "eval_task_acc_object_conditioned_reorientation_mc": 0.348, + "eval_task_acc_observer_distance_choice": 0.564, + "eval_task_acc_relative_3d_position_mc": 0.496, + "eval_task_acc_relative_direction_mc": 0.412, + "eval_task_acc_seam_continuity_mc": 0.7, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.98, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.972, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.964, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7283661378329055, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 3000 + }, + { + "epoch": 0.08612289349994268, + "grad_norm": 14.335950792612062, + "learning_rate": 9.917730702389172e-07, + "loss": 0.5042225360870362, + "step": 3005 + }, + { + "epoch": 0.08626619282356987, + "grad_norm": 25.37390996524324, + "learning_rate": 9.917310944635029e-07, + "loss": 0.5197614192962646, + "step": 3010 + }, + { + "epoch": 0.08640949214719706, + "grad_norm": 18.366551852195375, + "learning_rate": 9.916890127679888e-07, + "loss": 0.4907322883605957, + "step": 3015 + }, + { + "epoch": 0.08655279147082426, + "grad_norm": 32.63861750115156, + "learning_rate": 9.916468251614397e-07, + "loss": 0.5742916584014892, + "step": 3020 + }, + { + "epoch": 0.08669609079445145, + "grad_norm": 20.55950668162522, + "learning_rate": 9.916045316529425e-07, + "loss": 0.5101470947265625, + "step": 3025 + }, + { + "epoch": 0.08683939011807865, + "grad_norm": 16.129541742992892, + "learning_rate": 9.915621322516073e-07, + "loss": 0.5298290252685547, + "step": 3030 + }, + { + "epoch": 0.08698268944170584, + "grad_norm": 39.33258247012586, + "learning_rate": 9.915196269665677e-07, + "loss": 0.5268573760986328, + "step": 3035 + }, + { + "epoch": 0.08712598876533303, + "grad_norm": 21.15325131151765, + "learning_rate": 9.914770158069788e-07, + "loss": 0.5017885684967041, + "step": 3040 + }, + { + "epoch": 0.08726928808896021, + "grad_norm": 24.389067884887904, + "learning_rate": 9.914342987820194e-07, + "loss": 0.5390908241271972, + "step": 3045 + }, + { + "epoch": 0.08741258741258741, + "grad_norm": 17.42198164127877, + "learning_rate": 9.913914759008905e-07, + "loss": 0.5043983459472656, + "step": 3050 + }, + { + "epoch": 0.0875558867362146, + "grad_norm": 75.47060515490065, + "learning_rate": 9.91348547172817e-07, + "loss": 0.5201051712036133, + "step": 3055 + }, + { + "epoch": 0.0876991860598418, + "grad_norm": 32.22895458174531, + "learning_rate": 9.91305512607045e-07, + "loss": 0.5455232620239258, + "step": 3060 + }, + { + "epoch": 0.08784248538346899, + "grad_norm": 23.737330986004533, + "learning_rate": 9.912623722128448e-07, + "loss": 0.5340705394744873, + "step": 3065 + }, + { + "epoch": 0.08798578470709618, + "grad_norm": 41.07393725043532, + "learning_rate": 9.912191259995088e-07, + "loss": 0.5200640678405761, + "step": 3070 + }, + { + "epoch": 0.08812908403072338, + "grad_norm": 15.081963740074723, + "learning_rate": 9.911757739763525e-07, + "loss": 0.5320433616638184, + "step": 3075 + }, + { + "epoch": 0.08827238335435057, + "grad_norm": 19.25442703778434, + "learning_rate": 9.911323161527137e-07, + "loss": 0.5212348937988281, + "step": 3080 + }, + { + "epoch": 0.08841568267797777, + "grad_norm": 25.896415369054463, + "learning_rate": 9.910887525379536e-07, + "loss": 0.5380565643310546, + "step": 3085 + }, + { + "epoch": 0.08855898200160495, + "grad_norm": 16.88161542739723, + "learning_rate": 9.910450831414556e-07, + "loss": 0.5295086860656738, + "step": 3090 + }, + { + "epoch": 0.08870228132523214, + "grad_norm": 31.265680607886864, + "learning_rate": 9.910013079726266e-07, + "loss": 0.5480732917785645, + "step": 3095 + }, + { + "epoch": 0.08884558064885933, + "grad_norm": 50.705030410190076, + "learning_rate": 9.909574270408958e-07, + "loss": 0.5327776908874512, + "step": 3100 + }, + { + "epoch": 0.08898887997248653, + "grad_norm": 59.11315649572405, + "learning_rate": 9.909134403557148e-07, + "loss": 0.5702178001403808, + "step": 3105 + }, + { + "epoch": 0.08913217929611372, + "grad_norm": 18.182148527467746, + "learning_rate": 9.908693479265592e-07, + "loss": 0.5239349365234375, + "step": 3110 + }, + { + "epoch": 0.08927547861974092, + "grad_norm": 21.706431244796562, + "learning_rate": 9.90825149762926e-07, + "loss": 0.5321457386016846, + "step": 3115 + }, + { + "epoch": 0.08941877794336811, + "grad_norm": 20.166080034602384, + "learning_rate": 9.907808458743358e-07, + "loss": 0.5293474197387695, + "step": 3120 + }, + { + "epoch": 0.0895620772669953, + "grad_norm": 26.902463600340287, + "learning_rate": 9.907364362703315e-07, + "loss": 0.49239072799682615, + "step": 3125 + }, + { + "epoch": 0.0897053765906225, + "grad_norm": 25.35268404453983, + "learning_rate": 9.9069192096048e-07, + "loss": 0.48281135559082033, + "step": 3130 + }, + { + "epoch": 0.08984867591424968, + "grad_norm": 44.94944119027543, + "learning_rate": 9.906472999543688e-07, + "loss": 0.546223783493042, + "step": 3135 + }, + { + "epoch": 0.08999197523787687, + "grad_norm": 29.356869122778424, + "learning_rate": 9.9060257326161e-07, + "loss": 0.47902531623840333, + "step": 3140 + }, + { + "epoch": 0.09013527456150407, + "grad_norm": 39.84987666338268, + "learning_rate": 9.905577408918377e-07, + "loss": 0.5715572357177734, + "step": 3145 + }, + { + "epoch": 0.09027857388513126, + "grad_norm": 17.88106170512711, + "learning_rate": 9.90512802854709e-07, + "loss": 0.49596076011657714, + "step": 3150 + }, + { + "epoch": 0.09042187320875845, + "grad_norm": 38.16937052947071, + "learning_rate": 9.904677591599036e-07, + "loss": 0.5323156833648681, + "step": 3155 + }, + { + "epoch": 0.09056517253238565, + "grad_norm": 22.049206027624557, + "learning_rate": 9.904226098171238e-07, + "loss": 0.5108067512512207, + "step": 3160 + }, + { + "epoch": 0.09070847185601284, + "grad_norm": 17.57758926897527, + "learning_rate": 9.903773548360955e-07, + "loss": 0.5425436973571778, + "step": 3165 + }, + { + "epoch": 0.09085177117964004, + "grad_norm": 18.274406802149226, + "learning_rate": 9.903319942265662e-07, + "loss": 0.518244743347168, + "step": 3170 + }, + { + "epoch": 0.09099507050326723, + "grad_norm": 16.406831345082868, + "learning_rate": 9.902865279983067e-07, + "loss": 0.5040255546569824, + "step": 3175 + }, + { + "epoch": 0.09113836982689441, + "grad_norm": 27.567746820159503, + "learning_rate": 9.902409561611107e-07, + "loss": 0.47188420295715333, + "step": 3180 + }, + { + "epoch": 0.0912816691505216, + "grad_norm": 35.9187317385404, + "learning_rate": 9.901952787247945e-07, + "loss": 0.5349905014038085, + "step": 3185 + }, + { + "epoch": 0.0914249684741488, + "grad_norm": 28.151865189159757, + "learning_rate": 9.901494956991972e-07, + "loss": 0.502873706817627, + "step": 3190 + }, + { + "epoch": 0.09156826779777599, + "grad_norm": 20.634595900679493, + "learning_rate": 9.901036070941804e-07, + "loss": 0.5114718914031983, + "step": 3195 + }, + { + "epoch": 0.09171156712140319, + "grad_norm": 44.13481805783381, + "learning_rate": 9.900576129196286e-07, + "loss": 0.5260309219360352, + "step": 3200 + }, + { + "epoch": 0.09185486644503038, + "grad_norm": 25.237879256310034, + "learning_rate": 9.900115131854492e-07, + "loss": 0.5185188293457031, + "step": 3205 + }, + { + "epoch": 0.09199816576865757, + "grad_norm": 15.935166027394915, + "learning_rate": 9.899653079015722e-07, + "loss": 0.5157188415527344, + "step": 3210 + }, + { + "epoch": 0.09214146509228477, + "grad_norm": 38.90603179829148, + "learning_rate": 9.899189970779501e-07, + "loss": 0.5227045536041259, + "step": 3215 + }, + { + "epoch": 0.09228476441591196, + "grad_norm": 18.157071653788275, + "learning_rate": 9.898725807245589e-07, + "loss": 0.5072156429290772, + "step": 3220 + }, + { + "epoch": 0.09242806373953914, + "grad_norm": 18.241295322219784, + "learning_rate": 9.898260588513961e-07, + "loss": 0.5134231090545655, + "step": 3225 + }, + { + "epoch": 0.09257136306316634, + "grad_norm": 19.66659672490877, + "learning_rate": 9.89779431468483e-07, + "loss": 0.5088551044464111, + "step": 3230 + }, + { + "epoch": 0.09271466238679353, + "grad_norm": 29.092461906447404, + "learning_rate": 9.897326985858633e-07, + "loss": 0.5190189361572266, + "step": 3235 + }, + { + "epoch": 0.09285796171042072, + "grad_norm": 34.971665196193825, + "learning_rate": 9.896858602136035e-07, + "loss": 0.5362978935241699, + "step": 3240 + }, + { + "epoch": 0.09300126103404792, + "grad_norm": 49.75182325222677, + "learning_rate": 9.896389163617923e-07, + "loss": 0.5134912014007569, + "step": 3245 + }, + { + "epoch": 0.09314456035767511, + "grad_norm": 48.697388151584306, + "learning_rate": 9.895918670405418e-07, + "loss": 0.5339129447937012, + "step": 3250 + }, + { + "epoch": 0.09328785968130231, + "grad_norm": 24.25383544819964, + "learning_rate": 9.895447122599864e-07, + "loss": 0.5009629249572753, + "step": 3255 + }, + { + "epoch": 0.0934311590049295, + "grad_norm": 31.58148109828485, + "learning_rate": 9.894974520302834e-07, + "loss": 0.5412585735321045, + "step": 3260 + }, + { + "epoch": 0.0935744583285567, + "grad_norm": 22.081732916348027, + "learning_rate": 9.894500863616128e-07, + "loss": 0.5039048194885254, + "step": 3265 + }, + { + "epoch": 0.09371775765218388, + "grad_norm": 25.80547425692157, + "learning_rate": 9.894026152641774e-07, + "loss": 0.5130791664123535, + "step": 3270 + }, + { + "epoch": 0.09386105697581107, + "grad_norm": 26.792823312651997, + "learning_rate": 9.893550387482024e-07, + "loss": 0.5074618339538575, + "step": 3275 + }, + { + "epoch": 0.09400435629943826, + "grad_norm": 57.205415198742664, + "learning_rate": 9.893073568239358e-07, + "loss": 0.5286671161651612, + "step": 3280 + }, + { + "epoch": 0.09414765562306546, + "grad_norm": 33.48179803313024, + "learning_rate": 9.892595695016489e-07, + "loss": 0.5653787612915039, + "step": 3285 + }, + { + "epoch": 0.09429095494669265, + "grad_norm": 22.90157133496223, + "learning_rate": 9.892116767916347e-07, + "loss": 0.516090202331543, + "step": 3290 + }, + { + "epoch": 0.09443425427031985, + "grad_norm": 29.503112039008663, + "learning_rate": 9.891636787042094e-07, + "loss": 0.5422289371490479, + "step": 3295 + }, + { + "epoch": 0.09457755359394704, + "grad_norm": 42.84403332352723, + "learning_rate": 9.891155752497123e-07, + "loss": 0.5153655052185059, + "step": 3300 + }, + { + "epoch": 0.09457755359394704, + "eval_bfov_iou": 0.7837141948472952, + "eval_bfov_iou@0.1": 0.988, + "eval_bfov_iou@0.25": 0.984, + "eval_bfov_iou@0.5": 0.976, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5222857142857142, + "eval_exact_match": 0.429, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 333.9741, + "eval_samples_per_second": 5.988, + "eval_steps_per_second": 0.189, + "eval_task_acc_absolute_direction_mc": 0.86, + "eval_task_acc_camera_rotation_transform_mc": 0.256, + "eval_task_acc_object_conditioned_reorientation_mc": 0.328, + "eval_task_acc_observer_distance_choice": 0.608, + "eval_task_acc_relative_3d_position_mc": 0.54, + "eval_task_acc_relative_direction_mc": 0.384, + "eval_task_acc_seam_continuity_mc": 0.68, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.988, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.984, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7837141948472952, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 3300 + }, + { + "epoch": 0.09472085291757423, + "grad_norm": 30.258025394696695, + "learning_rate": 9.89067366438505e-07, + "loss": 0.52822265625, + "step": 3305 + }, + { + "epoch": 0.09486415224120143, + "grad_norm": 13.34229527326553, + "learning_rate": 9.890190522809715e-07, + "loss": 0.5266654968261719, + "step": 3310 + }, + { + "epoch": 0.09500745156482861, + "grad_norm": 20.40522599715385, + "learning_rate": 9.889706327875187e-07, + "loss": 0.5193912506103515, + "step": 3315 + }, + { + "epoch": 0.0951507508884558, + "grad_norm": 16.56246465328198, + "learning_rate": 9.889221079685765e-07, + "loss": 0.5100608825683594, + "step": 3320 + }, + { + "epoch": 0.095294050212083, + "grad_norm": 32.57871650198156, + "learning_rate": 9.888734778345972e-07, + "loss": 0.5257948875427246, + "step": 3325 + }, + { + "epoch": 0.09543734953571019, + "grad_norm": 21.40156096528397, + "learning_rate": 9.88824742396056e-07, + "loss": 0.5275650978088379, + "step": 3330 + }, + { + "epoch": 0.09558064885933738, + "grad_norm": 16.04221501383625, + "learning_rate": 9.887759016634505e-07, + "loss": 0.5476567268371582, + "step": 3335 + }, + { + "epoch": 0.09572394818296458, + "grad_norm": 24.442212805313257, + "learning_rate": 9.887269556473013e-07, + "loss": 0.5276049613952637, + "step": 3340 + }, + { + "epoch": 0.09586724750659177, + "grad_norm": 26.57305749533102, + "learning_rate": 9.886779043581512e-07, + "loss": 0.5246015548706054, + "step": 3345 + }, + { + "epoch": 0.09601054683021897, + "grad_norm": 20.8749380722424, + "learning_rate": 9.88628747806566e-07, + "loss": 0.5454081058502197, + "step": 3350 + }, + { + "epoch": 0.09615384615384616, + "grad_norm": 24.919044927582725, + "learning_rate": 9.885794860031343e-07, + "loss": 0.5231195449829101, + "step": 3355 + }, + { + "epoch": 0.09629714547747335, + "grad_norm": 30.10529584222661, + "learning_rate": 9.885301189584673e-07, + "loss": 0.5001602649688721, + "step": 3360 + }, + { + "epoch": 0.09644044480110053, + "grad_norm": 22.527673072505614, + "learning_rate": 9.884806466831984e-07, + "loss": 0.4897623538970947, + "step": 3365 + }, + { + "epoch": 0.09658374412472773, + "grad_norm": 31.577955040575638, + "learning_rate": 9.884310691879844e-07, + "loss": 0.523357629776001, + "step": 3370 + }, + { + "epoch": 0.09672704344835492, + "grad_norm": 20.833350814313576, + "learning_rate": 9.883813864835044e-07, + "loss": 0.5363403797149658, + "step": 3375 + }, + { + "epoch": 0.09687034277198212, + "grad_norm": 21.67574561479277, + "learning_rate": 9.883315985804598e-07, + "loss": 0.5363715171813965, + "step": 3380 + }, + { + "epoch": 0.09701364209560931, + "grad_norm": 17.99277578204225, + "learning_rate": 9.882817054895757e-07, + "loss": 0.5099105358123779, + "step": 3385 + }, + { + "epoch": 0.0971569414192365, + "grad_norm": 20.49242018864393, + "learning_rate": 9.882317072215987e-07, + "loss": 0.525055980682373, + "step": 3390 + }, + { + "epoch": 0.0973002407428637, + "grad_norm": 35.44131196283185, + "learning_rate": 9.881816037872985e-07, + "loss": 0.49782428741455076, + "step": 3395 + }, + { + "epoch": 0.09744354006649089, + "grad_norm": 95.59918082021525, + "learning_rate": 9.88131395197468e-07, + "loss": 0.5124666213989257, + "step": 3400 + }, + { + "epoch": 0.09758683939011809, + "grad_norm": 30.09064747558733, + "learning_rate": 9.880810814629217e-07, + "loss": 0.5339958190917968, + "step": 3405 + }, + { + "epoch": 0.09773013871374527, + "grad_norm": 32.12823907220615, + "learning_rate": 9.880306625944974e-07, + "loss": 0.4584778308868408, + "step": 3410 + }, + { + "epoch": 0.09787343803737246, + "grad_norm": 40.99673772015537, + "learning_rate": 9.879801386030558e-07, + "loss": 0.49283828735351565, + "step": 3415 + }, + { + "epoch": 0.09801673736099965, + "grad_norm": 24.881727680389236, + "learning_rate": 9.879295094994798e-07, + "loss": 0.5150506019592285, + "step": 3420 + }, + { + "epoch": 0.09816003668462685, + "grad_norm": 34.19877531903642, + "learning_rate": 9.878787752946746e-07, + "loss": 0.5144412040710449, + "step": 3425 + }, + { + "epoch": 0.09830333600825404, + "grad_norm": 35.73346601435321, + "learning_rate": 9.878279359995689e-07, + "loss": 0.487253475189209, + "step": 3430 + }, + { + "epoch": 0.09844663533188124, + "grad_norm": 33.144994103457044, + "learning_rate": 9.877769916251137e-07, + "loss": 0.509460163116455, + "step": 3435 + }, + { + "epoch": 0.09858993465550843, + "grad_norm": 27.089464972299055, + "learning_rate": 9.87725942182282e-07, + "loss": 0.5506721496582031, + "step": 3440 + }, + { + "epoch": 0.09873323397913562, + "grad_norm": 125.16684690532983, + "learning_rate": 9.876747876820705e-07, + "loss": 0.5382958889007569, + "step": 3445 + }, + { + "epoch": 0.09887653330276282, + "grad_norm": 24.18943422618106, + "learning_rate": 9.876235281354978e-07, + "loss": 0.5042176723480225, + "step": 3450 + }, + { + "epoch": 0.09901983262639, + "grad_norm": 20.809865356605297, + "learning_rate": 9.875721635536055e-07, + "loss": 0.5070887088775635, + "step": 3455 + }, + { + "epoch": 0.09916313195001719, + "grad_norm": 19.3467014443777, + "learning_rate": 9.875206939474575e-07, + "loss": 0.5397925853729248, + "step": 3460 + }, + { + "epoch": 0.09930643127364439, + "grad_norm": 21.957316659627903, + "learning_rate": 9.874691193281403e-07, + "loss": 0.476847505569458, + "step": 3465 + }, + { + "epoch": 0.09944973059727158, + "grad_norm": 25.05417488739938, + "learning_rate": 9.874174397067633e-07, + "loss": 0.5001289367675781, + "step": 3470 + }, + { + "epoch": 0.09959302992089877, + "grad_norm": 20.402470952180046, + "learning_rate": 9.873656550944589e-07, + "loss": 0.4968977928161621, + "step": 3475 + }, + { + "epoch": 0.09973632924452597, + "grad_norm": 16.20900969250893, + "learning_rate": 9.87313765502381e-07, + "loss": 0.5025802612304687, + "step": 3480 + }, + { + "epoch": 0.09987962856815316, + "grad_norm": 18.863723726371934, + "learning_rate": 9.87261770941707e-07, + "loss": 0.5090883255004883, + "step": 3485 + }, + { + "epoch": 0.10002292789178036, + "grad_norm": 21.04478175905767, + "learning_rate": 9.872096714236368e-07, + "loss": 0.4896389007568359, + "step": 3490 + }, + { + "epoch": 0.10016622721540755, + "grad_norm": 21.630405229143054, + "learning_rate": 9.871574669593924e-07, + "loss": 0.5102983951568604, + "step": 3495 + }, + { + "epoch": 0.10030952653903473, + "grad_norm": 19.980192748725116, + "learning_rate": 9.871051575602193e-07, + "loss": 0.4907646656036377, + "step": 3500 + }, + { + "epoch": 0.10045282586266192, + "grad_norm": 19.381817137225926, + "learning_rate": 9.870527432373846e-07, + "loss": 0.5036964416503906, + "step": 3505 + }, + { + "epoch": 0.10059612518628912, + "grad_norm": 22.664830179548783, + "learning_rate": 9.870002240021786e-07, + "loss": 0.5371236324310302, + "step": 3510 + }, + { + "epoch": 0.10073942450991631, + "grad_norm": 17.358238073169325, + "learning_rate": 9.869475998659142e-07, + "loss": 0.5007859706878662, + "step": 3515 + }, + { + "epoch": 0.1008827238335435, + "grad_norm": 13.626694506052864, + "learning_rate": 9.868948708399268e-07, + "loss": 0.4968564033508301, + "step": 3520 + }, + { + "epoch": 0.1010260231571707, + "grad_norm": 13.034418155726048, + "learning_rate": 9.86842036935574e-07, + "loss": 0.5062398910522461, + "step": 3525 + }, + { + "epoch": 0.1011693224807979, + "grad_norm": 16.517279463904952, + "learning_rate": 9.867890981642366e-07, + "loss": 0.5579112052917481, + "step": 3530 + }, + { + "epoch": 0.10131262180442509, + "grad_norm": 33.990024885705765, + "learning_rate": 9.86736054537318e-07, + "loss": 0.4968616008758545, + "step": 3535 + }, + { + "epoch": 0.10145592112805228, + "grad_norm": 23.7183836596022, + "learning_rate": 9.866829060662435e-07, + "loss": 0.48090319633483886, + "step": 3540 + }, + { + "epoch": 0.10159922045167946, + "grad_norm": 92.61966837398576, + "learning_rate": 9.866296527624616e-07, + "loss": 0.5060209274291992, + "step": 3545 + }, + { + "epoch": 0.10174251977530666, + "grad_norm": 23.525031538222503, + "learning_rate": 9.86576294637443e-07, + "loss": 0.5368023872375488, + "step": 3550 + }, + { + "epoch": 0.10188581909893385, + "grad_norm": 15.8894966485798, + "learning_rate": 9.865228317026817e-07, + "loss": 0.5261569499969483, + "step": 3555 + }, + { + "epoch": 0.10202911842256104, + "grad_norm": 28.81604699361697, + "learning_rate": 9.864692639696935e-07, + "loss": 0.5199954986572266, + "step": 3560 + }, + { + "epoch": 0.10217241774618824, + "grad_norm": 34.75048456698479, + "learning_rate": 9.864155914500164e-07, + "loss": 0.4960662841796875, + "step": 3565 + }, + { + "epoch": 0.10231571706981543, + "grad_norm": 53.715091292778574, + "learning_rate": 9.863618141552126e-07, + "loss": 0.5025854587554932, + "step": 3570 + }, + { + "epoch": 0.10245901639344263, + "grad_norm": 46.19668812817117, + "learning_rate": 9.863079320968652e-07, + "loss": 0.514333438873291, + "step": 3575 + }, + { + "epoch": 0.10260231571706982, + "grad_norm": 19.291937195917317, + "learning_rate": 9.862539452865808e-07, + "loss": 0.5403067111968994, + "step": 3580 + }, + { + "epoch": 0.10274561504069701, + "grad_norm": 26.392436765068705, + "learning_rate": 9.861998537359882e-07, + "loss": 0.5156404972076416, + "step": 3585 + }, + { + "epoch": 0.1028889143643242, + "grad_norm": 35.6206242571358, + "learning_rate": 9.861456574567387e-07, + "loss": 0.5340118885040284, + "step": 3590 + }, + { + "epoch": 0.10303221368795139, + "grad_norm": 20.92365110394907, + "learning_rate": 9.860913564605064e-07, + "loss": 0.5072038650512696, + "step": 3595 + }, + { + "epoch": 0.10317551301157858, + "grad_norm": 17.603054931068062, + "learning_rate": 9.860369507589883e-07, + "loss": 0.4995016098022461, + "step": 3600 + }, + { + "epoch": 0.10317551301157858, + "eval_bfov_iou": 0.7604577162414936, + "eval_bfov_iou@0.1": 0.976, + "eval_bfov_iou@0.25": 0.972, + "eval_bfov_iou@0.5": 0.968, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5205714285714286, + "eval_exact_match": 0.4105, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 369.1428, + "eval_samples_per_second": 5.418, + "eval_steps_per_second": 0.171, + "eval_task_acc_absolute_direction_mc": 0.808, + "eval_task_acc_camera_rotation_transform_mc": 0.288, + "eval_task_acc_object_conditioned_reorientation_mc": 0.356, + "eval_task_acc_observer_distance_choice": 0.576, + "eval_task_acc_relative_3d_position_mc": 0.524, + "eval_task_acc_relative_direction_mc": 0.396, + "eval_task_acc_seam_continuity_mc": 0.696, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.972, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.968, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7604577162414936, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 3600 + }, + { + "epoch": 0.10331881233520578, + "grad_norm": 19.481105353893412, + "learning_rate": 9.85982440363903e-07, + "loss": 0.520019817352295, + "step": 3605 + }, + { + "epoch": 0.10346211165883297, + "grad_norm": 22.86485013168239, + "learning_rate": 9.859278252869923e-07, + "loss": 0.5325165271759034, + "step": 3610 + }, + { + "epoch": 0.10360541098246016, + "grad_norm": 18.46341828693444, + "learning_rate": 9.858731055400205e-07, + "loss": 0.5026322364807129, + "step": 3615 + }, + { + "epoch": 0.10374871030608736, + "grad_norm": 14.853403268170345, + "learning_rate": 9.858182811347743e-07, + "loss": 0.5316049098968506, + "step": 3620 + }, + { + "epoch": 0.10389200962971455, + "grad_norm": 43.264210488345654, + "learning_rate": 9.85763352083063e-07, + "loss": 0.5207380294799805, + "step": 3625 + }, + { + "epoch": 0.10403530895334175, + "grad_norm": 24.49625682177483, + "learning_rate": 9.857083183967187e-07, + "loss": 0.5218274593353271, + "step": 3630 + }, + { + "epoch": 0.10417860827696893, + "grad_norm": 19.5143885634244, + "learning_rate": 9.856531800875954e-07, + "loss": 0.5232476234436035, + "step": 3635 + }, + { + "epoch": 0.10432190760059612, + "grad_norm": 46.958516165453794, + "learning_rate": 9.855979371675704e-07, + "loss": 0.5568093299865723, + "step": 3640 + }, + { + "epoch": 0.10446520692422331, + "grad_norm": 19.309248497584623, + "learning_rate": 9.855425896485428e-07, + "loss": 0.5101686477661133, + "step": 3645 + }, + { + "epoch": 0.10460850624785051, + "grad_norm": 22.25797045199054, + "learning_rate": 9.85487137542435e-07, + "loss": 0.5274618148803711, + "step": 3650 + }, + { + "epoch": 0.1047518055714777, + "grad_norm": 17.393424650229136, + "learning_rate": 9.85431580861191e-07, + "loss": 0.4943999290466309, + "step": 3655 + }, + { + "epoch": 0.1048951048951049, + "grad_norm": 32.74083186642051, + "learning_rate": 9.853759196167784e-07, + "loss": 0.5161127090454102, + "step": 3660 + }, + { + "epoch": 0.10503840421873209, + "grad_norm": 13.631629496213232, + "learning_rate": 9.853201538211864e-07, + "loss": 0.48990478515625, + "step": 3665 + }, + { + "epoch": 0.10518170354235928, + "grad_norm": 12.949972044105134, + "learning_rate": 9.852642834864274e-07, + "loss": 0.4852166175842285, + "step": 3670 + }, + { + "epoch": 0.10532500286598648, + "grad_norm": 20.049513930611074, + "learning_rate": 9.852083086245356e-07, + "loss": 0.5331484794616699, + "step": 3675 + }, + { + "epoch": 0.10546830218961367, + "grad_norm": 22.68927181423118, + "learning_rate": 9.851522292475684e-07, + "loss": 0.5623147010803222, + "step": 3680 + }, + { + "epoch": 0.10561160151324085, + "grad_norm": 21.682128134514375, + "learning_rate": 9.850960453676054e-07, + "loss": 0.4970057487487793, + "step": 3685 + }, + { + "epoch": 0.10575490083686805, + "grad_norm": 36.43988469963547, + "learning_rate": 9.850397569967487e-07, + "loss": 0.4905060291290283, + "step": 3690 + }, + { + "epoch": 0.10589820016049524, + "grad_norm": 19.74030113219953, + "learning_rate": 9.84983364147123e-07, + "loss": 0.5605355739593506, + "step": 3695 + }, + { + "epoch": 0.10604149948412243, + "grad_norm": 26.768588481040425, + "learning_rate": 9.849268668308755e-07, + "loss": 0.4853064060211182, + "step": 3700 + }, + { + "epoch": 0.10618479880774963, + "grad_norm": 21.103496077190815, + "learning_rate": 9.848702650601757e-07, + "loss": 0.5125981330871582, + "step": 3705 + }, + { + "epoch": 0.10632809813137682, + "grad_norm": 29.260142931276558, + "learning_rate": 9.84813558847216e-07, + "loss": 0.5003810882568359, + "step": 3710 + }, + { + "epoch": 0.10647139745500402, + "grad_norm": 14.687916049343256, + "learning_rate": 9.847567482042106e-07, + "loss": 0.5089735984802246, + "step": 3715 + }, + { + "epoch": 0.10661469677863121, + "grad_norm": 22.947764572190586, + "learning_rate": 9.846998331433974e-07, + "loss": 0.5038913726806641, + "step": 3720 + }, + { + "epoch": 0.1067579961022584, + "grad_norm": 17.928442122965837, + "learning_rate": 9.846428136770356e-07, + "loss": 0.47979888916015623, + "step": 3725 + }, + { + "epoch": 0.10690129542588558, + "grad_norm": 27.884077134611527, + "learning_rate": 9.84585689817407e-07, + "loss": 0.5264283180236816, + "step": 3730 + }, + { + "epoch": 0.10704459474951278, + "grad_norm": 14.342012649577129, + "learning_rate": 9.845284615768168e-07, + "loss": 0.5046662330627442, + "step": 3735 + }, + { + "epoch": 0.10718789407313997, + "grad_norm": 21.954304910365014, + "learning_rate": 9.84471128967592e-07, + "loss": 0.5011909484863282, + "step": 3740 + }, + { + "epoch": 0.10733119339676717, + "grad_norm": 17.097834212988705, + "learning_rate": 9.844136920020818e-07, + "loss": 0.5196532249450684, + "step": 3745 + }, + { + "epoch": 0.10747449272039436, + "grad_norm": 37.1800260794283, + "learning_rate": 9.843561506926587e-07, + "loss": 0.5050465106964112, + "step": 3750 + }, + { + "epoch": 0.10761779204402155, + "grad_norm": 14.318984541838857, + "learning_rate": 9.84298505051717e-07, + "loss": 0.4876245498657227, + "step": 3755 + }, + { + "epoch": 0.10776109136764875, + "grad_norm": 27.558385461820713, + "learning_rate": 9.842407550916741e-07, + "loss": 0.5230881214141846, + "step": 3760 + }, + { + "epoch": 0.10790439069127594, + "grad_norm": 16.966224817612964, + "learning_rate": 9.841829008249689e-07, + "loss": 0.5239606380462647, + "step": 3765 + }, + { + "epoch": 0.10804769001490314, + "grad_norm": 24.525273784344332, + "learning_rate": 9.841249422640637e-07, + "loss": 0.5625698566436768, + "step": 3770 + }, + { + "epoch": 0.10819098933853032, + "grad_norm": 17.915784618880572, + "learning_rate": 9.840668794214428e-07, + "loss": 0.4998626708984375, + "step": 3775 + }, + { + "epoch": 0.10833428866215751, + "grad_norm": 24.974926742670245, + "learning_rate": 9.84008712309613e-07, + "loss": 0.4878023624420166, + "step": 3780 + }, + { + "epoch": 0.1084775879857847, + "grad_norm": 34.717927627884706, + "learning_rate": 9.83950440941104e-07, + "loss": 0.4741241455078125, + "step": 3785 + }, + { + "epoch": 0.1086208873094119, + "grad_norm": 29.952785223221564, + "learning_rate": 9.838920653284674e-07, + "loss": 0.5071943283081055, + "step": 3790 + }, + { + "epoch": 0.10876418663303909, + "grad_norm": 15.210905179763898, + "learning_rate": 9.838335854842773e-07, + "loss": 0.4880509376525879, + "step": 3795 + }, + { + "epoch": 0.10890748595666629, + "grad_norm": 19.74499023270051, + "learning_rate": 9.837750014211307e-07, + "loss": 0.47911605834960935, + "step": 3800 + }, + { + "epoch": 0.10905078528029348, + "grad_norm": 23.794928066808925, + "learning_rate": 9.837163131516462e-07, + "loss": 0.5184255599975586, + "step": 3805 + }, + { + "epoch": 0.10919408460392067, + "grad_norm": 21.829168108260525, + "learning_rate": 9.836575206884661e-07, + "loss": 0.49016518592834474, + "step": 3810 + }, + { + "epoch": 0.10933738392754787, + "grad_norm": 41.03725033355982, + "learning_rate": 9.83598624044254e-07, + "loss": 0.5124398708343506, + "step": 3815 + }, + { + "epoch": 0.10948068325117505, + "grad_norm": 49.90752269248704, + "learning_rate": 9.835396232316964e-07, + "loss": 0.5034698963165283, + "step": 3820 + }, + { + "epoch": 0.10962398257480224, + "grad_norm": 17.965901362678277, + "learning_rate": 9.834805182635025e-07, + "loss": 0.5142681121826171, + "step": 3825 + }, + { + "epoch": 0.10976728189842944, + "grad_norm": 22.89205235318075, + "learning_rate": 9.834213091524033e-07, + "loss": 0.5366620063781739, + "step": 3830 + }, + { + "epoch": 0.10991058122205663, + "grad_norm": 21.96056151834303, + "learning_rate": 9.83361995911153e-07, + "loss": 0.5027626991271973, + "step": 3835 + }, + { + "epoch": 0.11005388054568382, + "grad_norm": 22.883237748279647, + "learning_rate": 9.833025785525274e-07, + "loss": 0.49997987747192385, + "step": 3840 + }, + { + "epoch": 0.11019717986931102, + "grad_norm": 15.552561166807799, + "learning_rate": 9.832430570893255e-07, + "loss": 0.5252890586853027, + "step": 3845 + }, + { + "epoch": 0.11034047919293821, + "grad_norm": 19.579575965218673, + "learning_rate": 9.831834315343682e-07, + "loss": 0.4912266254425049, + "step": 3850 + }, + { + "epoch": 0.1104837785165654, + "grad_norm": 18.846390012576084, + "learning_rate": 9.831237019004988e-07, + "loss": 0.4729150295257568, + "step": 3855 + }, + { + "epoch": 0.1106270778401926, + "grad_norm": 19.843077392473145, + "learning_rate": 9.830638682005837e-07, + "loss": 0.5415653705596923, + "step": 3860 + }, + { + "epoch": 0.11077037716381978, + "grad_norm": 17.35187593772947, + "learning_rate": 9.830039304475106e-07, + "loss": 0.5045701026916504, + "step": 3865 + }, + { + "epoch": 0.11091367648744697, + "grad_norm": 26.57131442135705, + "learning_rate": 9.829438886541908e-07, + "loss": 0.4952863693237305, + "step": 3870 + }, + { + "epoch": 0.11105697581107417, + "grad_norm": 16.40767488374686, + "learning_rate": 9.828837428335573e-07, + "loss": 0.5424654960632325, + "step": 3875 + }, + { + "epoch": 0.11120027513470136, + "grad_norm": 19.789604384488623, + "learning_rate": 9.828234929985655e-07, + "loss": 0.5189991950988769, + "step": 3880 + }, + { + "epoch": 0.11134357445832856, + "grad_norm": 31.872327346706424, + "learning_rate": 9.827631391621934e-07, + "loss": 0.484393310546875, + "step": 3885 + }, + { + "epoch": 0.11148687378195575, + "grad_norm": 14.866887096830244, + "learning_rate": 9.827026813374414e-07, + "loss": 0.5076639652252197, + "step": 3890 + }, + { + "epoch": 0.11163017310558294, + "grad_norm": 27.31536172219596, + "learning_rate": 9.826421195373324e-07, + "loss": 0.5379841804504395, + "step": 3895 + }, + { + "epoch": 0.11177347242921014, + "grad_norm": 23.871735516817694, + "learning_rate": 9.825814537749114e-07, + "loss": 0.5000497817993164, + "step": 3900 + }, + { + "epoch": 0.11177347242921014, + "eval_bfov_iou": 0.7773062586405984, + "eval_bfov_iou@0.1": 0.968, + "eval_bfov_iou@0.25": 0.96, + "eval_bfov_iou@0.5": 0.96, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5085714285714286, + "eval_exact_match": 0.4145, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 342.2707, + "eval_samples_per_second": 5.843, + "eval_steps_per_second": 0.184, + "eval_task_acc_absolute_direction_mc": 0.74, + "eval_task_acc_camera_rotation_transform_mc": 0.292, + "eval_task_acc_object_conditioned_reorientation_mc": 0.336, + "eval_task_acc_observer_distance_choice": 0.616, + "eval_task_acc_relative_3d_position_mc": 0.516, + "eval_task_acc_relative_direction_mc": 0.404, + "eval_task_acc_seam_continuity_mc": 0.656, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.968, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.96, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.96, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7773062586405984, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 3900 + }, + { + "epoch": 0.11191677175283733, + "grad_norm": 28.82195678465451, + "learning_rate": 9.82520684063246e-07, + "loss": 0.5284539222717285, + "step": 3905 + }, + { + "epoch": 0.11206007107646451, + "grad_norm": 17.270195456978694, + "learning_rate": 9.82459810415426e-07, + "loss": 0.49328389167785647, + "step": 3910 + }, + { + "epoch": 0.1122033704000917, + "grad_norm": 13.401310357731699, + "learning_rate": 9.823988328445642e-07, + "loss": 0.4924570083618164, + "step": 3915 + }, + { + "epoch": 0.1123466697237189, + "grad_norm": 24.919222176915998, + "learning_rate": 9.823377513637949e-07, + "loss": 0.5204029560089112, + "step": 3920 + }, + { + "epoch": 0.1124899690473461, + "grad_norm": 17.22046345604967, + "learning_rate": 9.822765659862751e-07, + "loss": 0.53695650100708, + "step": 3925 + }, + { + "epoch": 0.11263326837097329, + "grad_norm": 13.179214716980288, + "learning_rate": 9.822152767251847e-07, + "loss": 0.5094770431518555, + "step": 3930 + }, + { + "epoch": 0.11277656769460048, + "grad_norm": 13.711117819633424, + "learning_rate": 9.821538835937254e-07, + "loss": 0.493761682510376, + "step": 3935 + }, + { + "epoch": 0.11291986701822768, + "grad_norm": 15.769294690749037, + "learning_rate": 9.820923866051212e-07, + "loss": 0.5089295387268067, + "step": 3940 + }, + { + "epoch": 0.11306316634185487, + "grad_norm": 13.332501805353614, + "learning_rate": 9.82030785772619e-07, + "loss": 0.49037466049194334, + "step": 3945 + }, + { + "epoch": 0.11320646566548206, + "grad_norm": 34.12594214766252, + "learning_rate": 9.819690811094875e-07, + "loss": 0.5124929428100586, + "step": 3950 + }, + { + "epoch": 0.11334976498910924, + "grad_norm": 19.786691286670067, + "learning_rate": 9.819072726290185e-07, + "loss": 0.491590690612793, + "step": 3955 + }, + { + "epoch": 0.11349306431273644, + "grad_norm": 17.926786916691942, + "learning_rate": 9.818453603445252e-07, + "loss": 0.5123805046081543, + "step": 3960 + }, + { + "epoch": 0.11363636363636363, + "grad_norm": 32.9681478140541, + "learning_rate": 9.81783344269344e-07, + "loss": 0.5080521106719971, + "step": 3965 + }, + { + "epoch": 0.11377966295999083, + "grad_norm": 14.725129224277513, + "learning_rate": 9.817212244168331e-07, + "loss": 0.4962045192718506, + "step": 3970 + }, + { + "epoch": 0.11392296228361802, + "grad_norm": 17.371084839017456, + "learning_rate": 9.816590008003733e-07, + "loss": 0.5268577575683594, + "step": 3975 + }, + { + "epoch": 0.11406626160724521, + "grad_norm": 15.266244638127992, + "learning_rate": 9.815966734333678e-07, + "loss": 0.5484256744384766, + "step": 3980 + }, + { + "epoch": 0.11420956093087241, + "grad_norm": 12.591491413290875, + "learning_rate": 9.81534242329242e-07, + "loss": 0.5226043224334717, + "step": 3985 + }, + { + "epoch": 0.1143528602544996, + "grad_norm": 13.171087349279286, + "learning_rate": 9.814717075014437e-07, + "loss": 0.4949751377105713, + "step": 3990 + }, + { + "epoch": 0.1144961595781268, + "grad_norm": 22.115929673383757, + "learning_rate": 9.814090689634433e-07, + "loss": 0.4821035385131836, + "step": 3995 + }, + { + "epoch": 0.11463945890175399, + "grad_norm": 16.369754146329658, + "learning_rate": 9.813463267287329e-07, + "loss": 0.5143351554870605, + "step": 4000 + }, + { + "epoch": 0.11478275822538117, + "grad_norm": 18.30573871503357, + "learning_rate": 9.812834808108278e-07, + "loss": 0.5114687919616699, + "step": 4005 + }, + { + "epoch": 0.11492605754900836, + "grad_norm": 15.30405321861601, + "learning_rate": 9.812205312232648e-07, + "loss": 0.5113118171691895, + "step": 4010 + }, + { + "epoch": 0.11506935687263556, + "grad_norm": 14.247489991668818, + "learning_rate": 9.811574779796034e-07, + "loss": 0.5047449111938477, + "step": 4015 + }, + { + "epoch": 0.11521265619626275, + "grad_norm": 56.12927094982484, + "learning_rate": 9.810943210934257e-07, + "loss": 0.4744846343994141, + "step": 4020 + }, + { + "epoch": 0.11535595551988995, + "grad_norm": 19.08962915152303, + "learning_rate": 9.810310605783355e-07, + "loss": 0.4914724349975586, + "step": 4025 + }, + { + "epoch": 0.11549925484351714, + "grad_norm": 19.582136110221064, + "learning_rate": 9.809676964479594e-07, + "loss": 0.4643186092376709, + "step": 4030 + }, + { + "epoch": 0.11564255416714433, + "grad_norm": 53.00684988011477, + "learning_rate": 9.809042287159466e-07, + "loss": 0.5125024795532227, + "step": 4035 + }, + { + "epoch": 0.11578585349077153, + "grad_norm": 23.615586899488964, + "learning_rate": 9.808406573959676e-07, + "loss": 0.5415911674499512, + "step": 4040 + }, + { + "epoch": 0.11592915281439872, + "grad_norm": 13.707361270377246, + "learning_rate": 9.80776982501716e-07, + "loss": 0.5277876377105712, + "step": 4045 + }, + { + "epoch": 0.1160724521380259, + "grad_norm": 26.354120351606017, + "learning_rate": 9.807132040469077e-07, + "loss": 0.5098046779632568, + "step": 4050 + }, + { + "epoch": 0.1162157514616531, + "grad_norm": 16.077446678169487, + "learning_rate": 9.806493220452806e-07, + "loss": 0.49621992111206054, + "step": 4055 + }, + { + "epoch": 0.11635905078528029, + "grad_norm": 13.375480048956948, + "learning_rate": 9.805853365105952e-07, + "loss": 0.5093412876129151, + "step": 4060 + }, + { + "epoch": 0.11650235010890748, + "grad_norm": 16.66799801141065, + "learning_rate": 9.80521247456634e-07, + "loss": 0.4902738094329834, + "step": 4065 + }, + { + "epoch": 0.11664564943253468, + "grad_norm": 22.60080297643987, + "learning_rate": 9.80457054897202e-07, + "loss": 0.4709005355834961, + "step": 4070 + }, + { + "epoch": 0.11678894875616187, + "grad_norm": 18.305916274810983, + "learning_rate": 9.803927588461264e-07, + "loss": 0.4913516044616699, + "step": 4075 + }, + { + "epoch": 0.11693224807978907, + "grad_norm": 26.542500594039698, + "learning_rate": 9.803283593172564e-07, + "loss": 0.49268312454223634, + "step": 4080 + }, + { + "epoch": 0.11707554740341626, + "grad_norm": 13.57386199724532, + "learning_rate": 9.802638563244646e-07, + "loss": 0.5074368000030518, + "step": 4085 + }, + { + "epoch": 0.11721884672704345, + "grad_norm": 14.279023761659078, + "learning_rate": 9.801992498816443e-07, + "loss": 0.48483691215515134, + "step": 4090 + }, + { + "epoch": 0.11736214605067063, + "grad_norm": 45.61185401883648, + "learning_rate": 9.801345400027125e-07, + "loss": 0.49082159996032715, + "step": 4095 + }, + { + "epoch": 0.11750544537429783, + "grad_norm": 13.624034799166594, + "learning_rate": 9.800697267016076e-07, + "loss": 0.4942619323730469, + "step": 4100 + }, + { + "epoch": 0.11764874469792502, + "grad_norm": 33.33056846164641, + "learning_rate": 9.800048099922903e-07, + "loss": 0.5128925323486329, + "step": 4105 + }, + { + "epoch": 0.11779204402155222, + "grad_norm": 33.79540465497044, + "learning_rate": 9.799397898887442e-07, + "loss": 0.49074177742004393, + "step": 4110 + }, + { + "epoch": 0.11793534334517941, + "grad_norm": 25.184939789157823, + "learning_rate": 9.798746664049749e-07, + "loss": 0.5394467830657959, + "step": 4115 + }, + { + "epoch": 0.1180786426688066, + "grad_norm": 12.719614929989694, + "learning_rate": 9.798094395550096e-07, + "loss": 0.5310544013977051, + "step": 4120 + }, + { + "epoch": 0.1182219419924338, + "grad_norm": 15.449433255431309, + "learning_rate": 9.797441093528988e-07, + "loss": 0.5172051906585693, + "step": 4125 + }, + { + "epoch": 0.11836524131606099, + "grad_norm": 23.162205522089113, + "learning_rate": 9.796786758127147e-07, + "loss": 0.5099551200866699, + "step": 4130 + }, + { + "epoch": 0.11850854063968819, + "grad_norm": 11.659767291474235, + "learning_rate": 9.796131389485519e-07, + "loss": 0.47780523300170896, + "step": 4135 + }, + { + "epoch": 0.11865183996331537, + "grad_norm": 16.289539087790505, + "learning_rate": 9.79547498774527e-07, + "loss": 0.5195588111877442, + "step": 4140 + }, + { + "epoch": 0.11879513928694256, + "grad_norm": 56.69117001649127, + "learning_rate": 9.794817553047789e-07, + "loss": 0.4617317199707031, + "step": 4145 + }, + { + "epoch": 0.11893843861056975, + "grad_norm": 16.960332798570402, + "learning_rate": 9.794159085534695e-07, + "loss": 0.5002500057220459, + "step": 4150 + }, + { + "epoch": 0.11908173793419695, + "grad_norm": 20.539985248097118, + "learning_rate": 9.79349958534782e-07, + "loss": 0.48713130950927735, + "step": 4155 + }, + { + "epoch": 0.11922503725782414, + "grad_norm": 20.937088850106004, + "learning_rate": 9.792839052629218e-07, + "loss": 0.5202593803405762, + "step": 4160 + }, + { + "epoch": 0.11936833658145134, + "grad_norm": 24.547091627541924, + "learning_rate": 9.79217748752118e-07, + "loss": 0.5125520706176758, + "step": 4165 + }, + { + "epoch": 0.11951163590507853, + "grad_norm": 12.782009866029117, + "learning_rate": 9.791514890166196e-07, + "loss": 0.4814730644226074, + "step": 4170 + }, + { + "epoch": 0.11965493522870572, + "grad_norm": 18.861023234398978, + "learning_rate": 9.790851260707e-07, + "loss": 0.5317799568176269, + "step": 4175 + }, + { + "epoch": 0.11979823455233292, + "grad_norm": 18.848943951439697, + "learning_rate": 9.790186599286538e-07, + "loss": 0.530681037902832, + "step": 4180 + }, + { + "epoch": 0.1199415338759601, + "grad_norm": 18.232303506895324, + "learning_rate": 9.789520906047977e-07, + "loss": 0.4832651138305664, + "step": 4185 + }, + { + "epoch": 0.1200848331995873, + "grad_norm": 20.906739061905945, + "learning_rate": 9.788854181134712e-07, + "loss": 0.4830461025238037, + "step": 4190 + }, + { + "epoch": 0.12022813252321449, + "grad_norm": 23.290065832156266, + "learning_rate": 9.788186424690355e-07, + "loss": 0.5312097549438477, + "step": 4195 + }, + { + "epoch": 0.12037143184684168, + "grad_norm": 26.421985350008597, + "learning_rate": 9.787517636858742e-07, + "loss": 0.4817045211791992, + "step": 4200 + }, + { + "epoch": 0.12037143184684168, + "eval_bfov_iou": 0.7909349367234251, + "eval_bfov_iou@0.1": 0.976, + "eval_bfov_iou@0.25": 0.972, + "eval_bfov_iou@0.5": 0.964, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5394285714285715, + "eval_exact_match": 0.353, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 376.265, + "eval_samples_per_second": 5.315, + "eval_steps_per_second": 0.167, + "eval_task_acc_absolute_direction_mc": 0.848, + "eval_task_acc_camera_rotation_transform_mc": 0.288, + "eval_task_acc_object_conditioned_reorientation_mc": 0.364, + "eval_task_acc_observer_distance_choice": 0.572, + "eval_task_acc_relative_3d_position_mc": 0.544, + "eval_task_acc_relative_direction_mc": 0.428, + "eval_task_acc_seam_continuity_mc": 0.732, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.972, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.964, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7909349367234251, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 4200 + }, + { + "epoch": 0.12051473117046888, + "grad_norm": 18.057188677131254, + "learning_rate": 9.786847817783932e-07, + "loss": 0.4972041606903076, + "step": 4205 + }, + { + "epoch": 0.12065803049409607, + "grad_norm": 11.564609351615642, + "learning_rate": 9.786176967610208e-07, + "loss": 0.47958030700683596, + "step": 4210 + }, + { + "epoch": 0.12080132981772326, + "grad_norm": 19.20904972610022, + "learning_rate": 9.785505086482073e-07, + "loss": 0.5101867198944092, + "step": 4215 + }, + { + "epoch": 0.12094462914135046, + "grad_norm": 23.639694756209003, + "learning_rate": 9.784832174544247e-07, + "loss": 0.5132323265075683, + "step": 4220 + }, + { + "epoch": 0.12108792846497765, + "grad_norm": 25.657730516721745, + "learning_rate": 9.784158231941683e-07, + "loss": 0.5459356307983398, + "step": 4225 + }, + { + "epoch": 0.12123122778860483, + "grad_norm": 70.73406324692706, + "learning_rate": 9.783483258819543e-07, + "loss": 0.49274349212646484, + "step": 4230 + }, + { + "epoch": 0.12137452711223203, + "grad_norm": 18.728709797284957, + "learning_rate": 9.782807255323224e-07, + "loss": 0.5253486633300781, + "step": 4235 + }, + { + "epoch": 0.12151782643585922, + "grad_norm": 21.63756157240776, + "learning_rate": 9.782130221598334e-07, + "loss": 0.46839132308959963, + "step": 4240 + }, + { + "epoch": 0.12166112575948641, + "grad_norm": 29.03728784105589, + "learning_rate": 9.781452157790715e-07, + "loss": 0.48889880180358886, + "step": 4245 + }, + { + "epoch": 0.12180442508311361, + "grad_norm": 23.20642421613957, + "learning_rate": 9.780773064046415e-07, + "loss": 0.5113687515258789, + "step": 4250 + }, + { + "epoch": 0.1219477244067408, + "grad_norm": 21.273658944417285, + "learning_rate": 9.780092940511718e-07, + "loss": 0.5189097404479981, + "step": 4255 + }, + { + "epoch": 0.122091023730368, + "grad_norm": 19.69625450680951, + "learning_rate": 9.779411787333123e-07, + "loss": 0.48878931999206543, + "step": 4260 + }, + { + "epoch": 0.12223432305399519, + "grad_norm": 25.28313707367948, + "learning_rate": 9.778729604657353e-07, + "loss": 0.5210617542266845, + "step": 4265 + }, + { + "epoch": 0.12237762237762238, + "grad_norm": 22.91045398031361, + "learning_rate": 9.778046392631348e-07, + "loss": 0.4933749198913574, + "step": 4270 + }, + { + "epoch": 0.12252092170124956, + "grad_norm": 18.348879939038067, + "learning_rate": 9.777362151402277e-07, + "loss": 0.48871479034423826, + "step": 4275 + }, + { + "epoch": 0.12266422102487676, + "grad_norm": 45.30152328875519, + "learning_rate": 9.776676881117527e-07, + "loss": 0.487711763381958, + "step": 4280 + }, + { + "epoch": 0.12280752034850395, + "grad_norm": 23.86475899237234, + "learning_rate": 9.775990581924706e-07, + "loss": 0.5172350406646729, + "step": 4285 + }, + { + "epoch": 0.12295081967213115, + "grad_norm": 15.269565141248092, + "learning_rate": 9.775303253971646e-07, + "loss": 0.4784417152404785, + "step": 4290 + }, + { + "epoch": 0.12309411899575834, + "grad_norm": 19.11506890694992, + "learning_rate": 9.774614897406396e-07, + "loss": 0.48580150604248046, + "step": 4295 + }, + { + "epoch": 0.12323741831938553, + "grad_norm": 16.38069521851006, + "learning_rate": 9.773925512377233e-07, + "loss": 0.481754207611084, + "step": 4300 + }, + { + "epoch": 0.12338071764301273, + "grad_norm": 14.4992151252462, + "learning_rate": 9.773235099032651e-07, + "loss": 0.5069381713867187, + "step": 4305 + }, + { + "epoch": 0.12352401696663992, + "grad_norm": 17.409243762046863, + "learning_rate": 9.772543657521368e-07, + "loss": 0.5002931594848633, + "step": 4310 + }, + { + "epoch": 0.12366731629026712, + "grad_norm": 16.435374205545223, + "learning_rate": 9.771851187992319e-07, + "loss": 0.5187475204467773, + "step": 4315 + }, + { + "epoch": 0.12381061561389431, + "grad_norm": 20.490124674716956, + "learning_rate": 9.771157690594666e-07, + "loss": 0.5086021423339844, + "step": 4320 + }, + { + "epoch": 0.12395391493752149, + "grad_norm": 24.047643200914553, + "learning_rate": 9.770463165477792e-07, + "loss": 0.5026821613311767, + "step": 4325 + }, + { + "epoch": 0.12409721426114868, + "grad_norm": 13.827300630011202, + "learning_rate": 9.769767612791296e-07, + "loss": 0.5192001342773438, + "step": 4330 + }, + { + "epoch": 0.12424051358477588, + "grad_norm": 12.593014949304044, + "learning_rate": 9.769071032685e-07, + "loss": 0.5065165519714355, + "step": 4335 + }, + { + "epoch": 0.12438381290840307, + "grad_norm": 11.559341843942319, + "learning_rate": 9.768373425308957e-07, + "loss": 0.5076734542846679, + "step": 4340 + }, + { + "epoch": 0.12452711223203027, + "grad_norm": 20.412983521818415, + "learning_rate": 9.767674790813425e-07, + "loss": 0.5083989143371582, + "step": 4345 + }, + { + "epoch": 0.12467041155565746, + "grad_norm": 56.13403339250387, + "learning_rate": 9.766975129348897e-07, + "loss": 0.5325092315673828, + "step": 4350 + }, + { + "epoch": 0.12481371087928465, + "grad_norm": 16.610067438207082, + "learning_rate": 9.76627444106608e-07, + "loss": 0.5078094482421875, + "step": 4355 + }, + { + "epoch": 0.12495701020291185, + "grad_norm": 11.473689429258457, + "learning_rate": 9.7655727261159e-07, + "loss": 0.502854585647583, + "step": 4360 + }, + { + "epoch": 0.12510030952653903, + "grad_norm": 29.14122765481463, + "learning_rate": 9.764869984649516e-07, + "loss": 0.5060647010803223, + "step": 4365 + }, + { + "epoch": 0.12524360885016622, + "grad_norm": 22.14695101664338, + "learning_rate": 9.764166216818297e-07, + "loss": 0.49750146865844724, + "step": 4370 + }, + { + "epoch": 0.12538690817379342, + "grad_norm": 12.125076464574569, + "learning_rate": 9.763461422773833e-07, + "loss": 0.5144474029541015, + "step": 4375 + }, + { + "epoch": 0.1255302074974206, + "grad_norm": 15.7459984917081, + "learning_rate": 9.76275560266794e-07, + "loss": 0.5396691799163819, + "step": 4380 + }, + { + "epoch": 0.1256735068210478, + "grad_norm": 17.83066381824016, + "learning_rate": 9.762048756652657e-07, + "loss": 0.5434780120849609, + "step": 4385 + }, + { + "epoch": 0.125816806144675, + "grad_norm": 10.070995889870613, + "learning_rate": 9.761340884880238e-07, + "loss": 0.4675254821777344, + "step": 4390 + }, + { + "epoch": 0.1259601054683022, + "grad_norm": 13.53367345493382, + "learning_rate": 9.76063198750316e-07, + "loss": 0.5256925582885742, + "step": 4395 + }, + { + "epoch": 0.12610340479192939, + "grad_norm": 27.90982250896573, + "learning_rate": 9.759922064674118e-07, + "loss": 0.5096074104309082, + "step": 4400 + }, + { + "epoch": 0.12624670411555658, + "grad_norm": 17.57061502223891, + "learning_rate": 9.759211116546039e-07, + "loss": 0.4949976921081543, + "step": 4405 + }, + { + "epoch": 0.12639000343918377, + "grad_norm": 30.837132777186252, + "learning_rate": 9.758499143272055e-07, + "loss": 0.505458927154541, + "step": 4410 + }, + { + "epoch": 0.12653330276281097, + "grad_norm": 16.400889210499912, + "learning_rate": 9.75778614500553e-07, + "loss": 0.4983267307281494, + "step": 4415 + }, + { + "epoch": 0.12667660208643816, + "grad_norm": 15.068856225186671, + "learning_rate": 9.757072121900049e-07, + "loss": 0.516080379486084, + "step": 4420 + }, + { + "epoch": 0.12681990141006536, + "grad_norm": 14.601558567899362, + "learning_rate": 9.756357074109409e-07, + "loss": 0.5046076297760009, + "step": 4425 + }, + { + "epoch": 0.12696320073369255, + "grad_norm": 30.726164915668207, + "learning_rate": 9.755641001787636e-07, + "loss": 0.5310994148254394, + "step": 4430 + }, + { + "epoch": 0.12710650005731972, + "grad_norm": 35.374831874575236, + "learning_rate": 9.754923905088973e-07, + "loss": 0.4986581802368164, + "step": 4435 + }, + { + "epoch": 0.1272497993809469, + "grad_norm": 45.32289613084723, + "learning_rate": 9.754205784167886e-07, + "loss": 0.509913444519043, + "step": 4440 + }, + { + "epoch": 0.1273930987045741, + "grad_norm": 14.62741741033143, + "learning_rate": 9.753486639179057e-07, + "loss": 0.48914461135864257, + "step": 4445 + }, + { + "epoch": 0.1275363980282013, + "grad_norm": 22.683773301972842, + "learning_rate": 9.752766470277394e-07, + "loss": 0.5213032722473144, + "step": 4450 + }, + { + "epoch": 0.1276796973518285, + "grad_norm": 21.96102069268189, + "learning_rate": 9.752045277618022e-07, + "loss": 0.4965799331665039, + "step": 4455 + }, + { + "epoch": 0.12782299667545569, + "grad_norm": 47.23811503710038, + "learning_rate": 9.751323061356287e-07, + "loss": 0.4983967781066895, + "step": 4460 + }, + { + "epoch": 0.12796629599908288, + "grad_norm": 29.742628752018977, + "learning_rate": 9.750599821647757e-07, + "loss": 0.5199332714080811, + "step": 4465 + }, + { + "epoch": 0.12810959532271007, + "grad_norm": 36.774203216105754, + "learning_rate": 9.749875558648222e-07, + "loss": 0.488204288482666, + "step": 4470 + }, + { + "epoch": 0.12825289464633727, + "grad_norm": 15.732139177912495, + "learning_rate": 9.749150272513686e-07, + "loss": 0.5302542686462403, + "step": 4475 + }, + { + "epoch": 0.12839619396996446, + "grad_norm": 29.594270777551223, + "learning_rate": 9.74842396340038e-07, + "loss": 0.5332390785217285, + "step": 4480 + }, + { + "epoch": 0.12853949329359166, + "grad_norm": 45.04957416312055, + "learning_rate": 9.747696631464752e-07, + "loss": 0.4826493263244629, + "step": 4485 + }, + { + "epoch": 0.12868279261721885, + "grad_norm": 16.13021765946701, + "learning_rate": 9.746968276863472e-07, + "loss": 0.5105721473693847, + "step": 4490 + }, + { + "epoch": 0.12882609194084604, + "grad_norm": 23.80936869116072, + "learning_rate": 9.746238899753427e-07, + "loss": 0.5006115436553955, + "step": 4495 + }, + { + "epoch": 0.12896939126447324, + "grad_norm": 24.982974196025705, + "learning_rate": 9.745508500291728e-07, + "loss": 0.4822225093841553, + "step": 4500 + }, + { + "epoch": 0.12896939126447324, + "eval_bfov_iou": 0.7996624037660007, + "eval_bfov_iou@0.1": 0.976, + "eval_bfov_iou@0.25": 0.976, + "eval_bfov_iou@0.5": 0.976, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5514285714285714, + "eval_exact_match": 0.3405, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 371.7399, + "eval_samples_per_second": 5.38, + "eval_steps_per_second": 0.169, + "eval_task_acc_absolute_direction_mc": 0.852, + "eval_task_acc_camera_rotation_transform_mc": 0.272, + "eval_task_acc_object_conditioned_reorientation_mc": 0.392, + "eval_task_acc_observer_distance_choice": 0.608, + "eval_task_acc_relative_3d_position_mc": 0.568, + "eval_task_acc_relative_direction_mc": 0.48, + "eval_task_acc_seam_continuity_mc": 0.688, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7996624037660007, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 4500 + }, + { + "epoch": 0.12911269058810043, + "grad_norm": 17.154513844751147, + "learning_rate": 9.744777078635707e-07, + "loss": 0.4886470794677734, + "step": 4505 + }, + { + "epoch": 0.12925598991172763, + "grad_norm": 17.701584572153333, + "learning_rate": 9.74404463494291e-07, + "loss": 0.4812470436096191, + "step": 4510 + }, + { + "epoch": 0.12939928923535482, + "grad_norm": 39.2006692141387, + "learning_rate": 9.743311169371112e-07, + "loss": 0.5054436683654785, + "step": 4515 + }, + { + "epoch": 0.129542588558982, + "grad_norm": 27.24093639831892, + "learning_rate": 9.7425766820783e-07, + "loss": 0.5407980918884278, + "step": 4520 + }, + { + "epoch": 0.1296858878826092, + "grad_norm": 11.483254392925035, + "learning_rate": 9.741841173222685e-07, + "loss": 0.4838881492614746, + "step": 4525 + }, + { + "epoch": 0.12982918720623637, + "grad_norm": 16.72990365662461, + "learning_rate": 9.741104642962696e-07, + "loss": 0.462264347076416, + "step": 4530 + }, + { + "epoch": 0.12997248652986357, + "grad_norm": 22.141238414577803, + "learning_rate": 9.740367091456985e-07, + "loss": 0.5117775917053222, + "step": 4535 + }, + { + "epoch": 0.13011578585349076, + "grad_norm": 15.337907230151824, + "learning_rate": 9.739628518864424e-07, + "loss": 0.5028968811035156, + "step": 4540 + }, + { + "epoch": 0.13025908517711796, + "grad_norm": 23.2814928947381, + "learning_rate": 9.7388889253441e-07, + "loss": 0.4743380546569824, + "step": 4545 + }, + { + "epoch": 0.13040238450074515, + "grad_norm": 21.518869984713245, + "learning_rate": 9.738148311055325e-07, + "loss": 0.46238031387329104, + "step": 4550 + }, + { + "epoch": 0.13054568382437234, + "grad_norm": 19.524287696988225, + "learning_rate": 9.737406676157632e-07, + "loss": 0.5396129131317139, + "step": 4555 + }, + { + "epoch": 0.13068898314799954, + "grad_norm": 14.03434951859181, + "learning_rate": 9.736664020810765e-07, + "loss": 0.526594877243042, + "step": 4560 + }, + { + "epoch": 0.13083228247162673, + "grad_norm": 21.363034827585434, + "learning_rate": 9.735920345174698e-07, + "loss": 0.5101262092590332, + "step": 4565 + }, + { + "epoch": 0.13097558179525393, + "grad_norm": 16.96439864448951, + "learning_rate": 9.73517564940962e-07, + "loss": 0.4964465141296387, + "step": 4570 + }, + { + "epoch": 0.13111888111888112, + "grad_norm": 37.52402714567032, + "learning_rate": 9.734429933675937e-07, + "loss": 0.5168231010437012, + "step": 4575 + }, + { + "epoch": 0.1312621804425083, + "grad_norm": 14.140816309408445, + "learning_rate": 9.733683198134284e-07, + "loss": 0.46343770027160647, + "step": 4580 + }, + { + "epoch": 0.1314054797661355, + "grad_norm": 15.27257905898339, + "learning_rate": 9.732935442945508e-07, + "loss": 0.4847858905792236, + "step": 4585 + }, + { + "epoch": 0.1315487790897627, + "grad_norm": 23.770957074218845, + "learning_rate": 9.732186668270671e-07, + "loss": 0.4813075542449951, + "step": 4590 + }, + { + "epoch": 0.1316920784133899, + "grad_norm": 17.70649112198561, + "learning_rate": 9.731436874271069e-07, + "loss": 0.5111162185668945, + "step": 4595 + }, + { + "epoch": 0.1318353777370171, + "grad_norm": 13.531152951367137, + "learning_rate": 9.730686061108206e-07, + "loss": 0.5207145690917969, + "step": 4600 + }, + { + "epoch": 0.13197867706064428, + "grad_norm": 20.957038540043612, + "learning_rate": 9.72993422894381e-07, + "loss": 0.46895484924316405, + "step": 4605 + }, + { + "epoch": 0.13212197638427148, + "grad_norm": 29.320384601434387, + "learning_rate": 9.729181377939825e-07, + "loss": 0.5442482471466065, + "step": 4610 + }, + { + "epoch": 0.13226527570789867, + "grad_norm": 16.878155731522202, + "learning_rate": 9.72842750825842e-07, + "loss": 0.48004660606384275, + "step": 4615 + }, + { + "epoch": 0.13240857503152584, + "grad_norm": 14.83323849096497, + "learning_rate": 9.72767262006198e-07, + "loss": 0.4698190689086914, + "step": 4620 + }, + { + "epoch": 0.13255187435515303, + "grad_norm": 18.371496197473252, + "learning_rate": 9.726916713513107e-07, + "loss": 0.5007077217102051, + "step": 4625 + }, + { + "epoch": 0.13269517367878023, + "grad_norm": 32.24381396108504, + "learning_rate": 9.726159788774628e-07, + "loss": 0.4910573482513428, + "step": 4630 + }, + { + "epoch": 0.13283847300240742, + "grad_norm": 20.778917576273646, + "learning_rate": 9.725401846009587e-07, + "loss": 0.4990230560302734, + "step": 4635 + }, + { + "epoch": 0.13298177232603461, + "grad_norm": 22.056347487246615, + "learning_rate": 9.724642885381243e-07, + "loss": 0.5154306411743164, + "step": 4640 + }, + { + "epoch": 0.1331250716496618, + "grad_norm": 23.687971965547195, + "learning_rate": 9.723882907053083e-07, + "loss": 0.5162612915039062, + "step": 4645 + }, + { + "epoch": 0.133268370973289, + "grad_norm": 33.181874803897465, + "learning_rate": 9.723121911188803e-07, + "loss": 0.5080151557922363, + "step": 4650 + }, + { + "epoch": 0.1334116702969162, + "grad_norm": 43.778972138298435, + "learning_rate": 9.722359897952328e-07, + "loss": 0.48526363372802733, + "step": 4655 + }, + { + "epoch": 0.1335549696205434, + "grad_norm": 19.857905265050906, + "learning_rate": 9.721596867507796e-07, + "loss": 0.4619903564453125, + "step": 4660 + }, + { + "epoch": 0.13369826894417058, + "grad_norm": 24.497441026723514, + "learning_rate": 9.720832820019561e-07, + "loss": 0.5051339149475098, + "step": 4665 + }, + { + "epoch": 0.13384156826779778, + "grad_norm": 17.904443370690807, + "learning_rate": 9.72006775565221e-07, + "loss": 0.5117093086242676, + "step": 4670 + }, + { + "epoch": 0.13398486759142497, + "grad_norm": 25.081307192223605, + "learning_rate": 9.719301674570533e-07, + "loss": 0.4844047546386719, + "step": 4675 + }, + { + "epoch": 0.13412816691505217, + "grad_norm": 16.638957073805212, + "learning_rate": 9.718534576939546e-07, + "loss": 0.510632848739624, + "step": 4680 + }, + { + "epoch": 0.13427146623867936, + "grad_norm": 11.932699231498903, + "learning_rate": 9.717766462924487e-07, + "loss": 0.518170690536499, + "step": 4685 + }, + { + "epoch": 0.13441476556230655, + "grad_norm": 12.174077764032681, + "learning_rate": 9.716997332690807e-07, + "loss": 0.48838605880737307, + "step": 4690 + }, + { + "epoch": 0.13455806488593375, + "grad_norm": 187.3235161501475, + "learning_rate": 9.71622718640418e-07, + "loss": 0.46824088096618655, + "step": 4695 + }, + { + "epoch": 0.13470136420956094, + "grad_norm": 21.075705468182, + "learning_rate": 9.715456024230497e-07, + "loss": 0.47347316741943357, + "step": 4700 + }, + { + "epoch": 0.13484466353318814, + "grad_norm": 14.58619437826438, + "learning_rate": 9.714683846335868e-07, + "loss": 0.5104803085327149, + "step": 4705 + }, + { + "epoch": 0.1349879628568153, + "grad_norm": 33.77154459685988, + "learning_rate": 9.71391065288662e-07, + "loss": 0.5249171257019043, + "step": 4710 + }, + { + "epoch": 0.1351312621804425, + "grad_norm": 20.742549173510856, + "learning_rate": 9.713136444049305e-07, + "loss": 0.516994571685791, + "step": 4715 + }, + { + "epoch": 0.1352745615040697, + "grad_norm": 19.328477244812564, + "learning_rate": 9.712361219990688e-07, + "loss": 0.5117194652557373, + "step": 4720 + }, + { + "epoch": 0.13541786082769688, + "grad_norm": 18.53726992776087, + "learning_rate": 9.711584980877754e-07, + "loss": 0.48290290832519533, + "step": 4725 + }, + { + "epoch": 0.13556116015132408, + "grad_norm": 57.098815948762294, + "learning_rate": 9.710807726877705e-07, + "loss": 0.4988711357116699, + "step": 4730 + }, + { + "epoch": 0.13570445947495127, + "grad_norm": 37.79930522646733, + "learning_rate": 9.710029458157964e-07, + "loss": 0.4880092620849609, + "step": 4735 + }, + { + "epoch": 0.13584775879857847, + "grad_norm": 19.684492399467917, + "learning_rate": 9.709250174886176e-07, + "loss": 0.49373273849487304, + "step": 4740 + }, + { + "epoch": 0.13599105812220566, + "grad_norm": 15.824824038013592, + "learning_rate": 9.708469877230195e-07, + "loss": 0.5003787040710449, + "step": 4745 + }, + { + "epoch": 0.13613435744583285, + "grad_norm": 15.230793496551383, + "learning_rate": 9.707688565358104e-07, + "loss": 0.4792490482330322, + "step": 4750 + }, + { + "epoch": 0.13627765676946005, + "grad_norm": 18.27042963122755, + "learning_rate": 9.706906239438194e-07, + "loss": 0.49028782844543456, + "step": 4755 + }, + { + "epoch": 0.13642095609308724, + "grad_norm": 19.747032443388928, + "learning_rate": 9.706122899638984e-07, + "loss": 0.5019127368927002, + "step": 4760 + }, + { + "epoch": 0.13656425541671444, + "grad_norm": 29.031362993927115, + "learning_rate": 9.705338546129207e-07, + "loss": 0.49912223815917967, + "step": 4765 + }, + { + "epoch": 0.13670755474034163, + "grad_norm": 22.369952670118447, + "learning_rate": 9.704553179077814e-07, + "loss": 0.4927377223968506, + "step": 4770 + }, + { + "epoch": 0.13685085406396882, + "grad_norm": 16.580921724009137, + "learning_rate": 9.703766798653975e-07, + "loss": 0.46930551528930664, + "step": 4775 + }, + { + "epoch": 0.13699415338759602, + "grad_norm": 18.017383303910776, + "learning_rate": 9.70297940502708e-07, + "loss": 0.5236422061920166, + "step": 4780 + }, + { + "epoch": 0.1371374527112232, + "grad_norm": 14.020381333968796, + "learning_rate": 9.70219099836673e-07, + "loss": 0.4743513107299805, + "step": 4785 + }, + { + "epoch": 0.1372807520348504, + "grad_norm": 15.139322243532161, + "learning_rate": 9.701401578842756e-07, + "loss": 0.4708244800567627, + "step": 4790 + }, + { + "epoch": 0.1374240513584776, + "grad_norm": 13.611944706329444, + "learning_rate": 9.700611146625197e-07, + "loss": 0.47497267723083497, + "step": 4795 + }, + { + "epoch": 0.1375673506821048, + "grad_norm": 16.9120666067039, + "learning_rate": 9.699819701884319e-07, + "loss": 0.5060768127441406, + "step": 4800 + }, + { + "epoch": 0.1375673506821048, + "eval_bfov_iou": 0.787988294717137, + "eval_bfov_iou@0.1": 0.96, + "eval_bfov_iou@0.25": 0.96, + "eval_bfov_iou@0.5": 0.956, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5165714285714286, + "eval_exact_match": 0.371, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 361.9567, + "eval_samples_per_second": 5.526, + "eval_steps_per_second": 0.174, + "eval_task_acc_absolute_direction_mc": 0.796, + "eval_task_acc_camera_rotation_transform_mc": 0.288, + "eval_task_acc_object_conditioned_reorientation_mc": 0.344, + "eval_task_acc_observer_distance_choice": 0.576, + "eval_task_acc_relative_3d_position_mc": 0.512, + "eval_task_acc_relative_direction_mc": 0.416, + "eval_task_acc_seam_continuity_mc": 0.684, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.96, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.96, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.956, + "eval_task_bfov_iou_referring_grounding_bfov": 0.787988294717137, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 4800 + }, + { + "epoch": 0.13771065000573196, + "grad_norm": 19.83559293214104, + "learning_rate": 9.699027244790596e-07, + "loss": 0.5190639972686768, + "step": 4805 + }, + { + "epoch": 0.13785394932935915, + "grad_norm": 16.52553581973199, + "learning_rate": 9.698233775514727e-07, + "loss": 0.47678437232971194, + "step": 4810 + }, + { + "epoch": 0.13799724865298635, + "grad_norm": 29.728843954799625, + "learning_rate": 9.697439294227626e-07, + "loss": 0.4892725944519043, + "step": 4815 + }, + { + "epoch": 0.13814054797661354, + "grad_norm": 10.504487620769096, + "learning_rate": 9.696643801100429e-07, + "loss": 0.49016690254211426, + "step": 4820 + }, + { + "epoch": 0.13828384730024074, + "grad_norm": 30.213419610306957, + "learning_rate": 9.695847296304485e-07, + "loss": 0.5165000915527344, + "step": 4825 + }, + { + "epoch": 0.13842714662386793, + "grad_norm": 18.744383086420395, + "learning_rate": 9.695049780011363e-07, + "loss": 0.5053626537322998, + "step": 4830 + }, + { + "epoch": 0.13857044594749512, + "grad_norm": 16.29708261138083, + "learning_rate": 9.694251252392853e-07, + "loss": 0.4964704990386963, + "step": 4835 + }, + { + "epoch": 0.13871374527112232, + "grad_norm": 13.94691048055298, + "learning_rate": 9.693451713620956e-07, + "loss": 0.5092603206634522, + "step": 4840 + }, + { + "epoch": 0.1388570445947495, + "grad_norm": 33.95490735148, + "learning_rate": 9.692651163867898e-07, + "loss": 0.47959070205688475, + "step": 4845 + }, + { + "epoch": 0.1390003439183767, + "grad_norm": 25.77356242754255, + "learning_rate": 9.691849603306116e-07, + "loss": 0.517023229598999, + "step": 4850 + }, + { + "epoch": 0.1391436432420039, + "grad_norm": 59.31389445654952, + "learning_rate": 9.691047032108273e-07, + "loss": 0.5355507373809815, + "step": 4855 + }, + { + "epoch": 0.1392869425656311, + "grad_norm": 15.379902496961899, + "learning_rate": 9.690243450447238e-07, + "loss": 0.5154154777526856, + "step": 4860 + }, + { + "epoch": 0.1394302418892583, + "grad_norm": 17.516548042259355, + "learning_rate": 9.689438858496111e-07, + "loss": 0.4845101356506348, + "step": 4865 + }, + { + "epoch": 0.13957354121288548, + "grad_norm": 12.934430968850247, + "learning_rate": 9.688633256428199e-07, + "loss": 0.46013898849487306, + "step": 4870 + }, + { + "epoch": 0.13971684053651268, + "grad_norm": 35.83814607962086, + "learning_rate": 9.68782664441703e-07, + "loss": 0.4999227046966553, + "step": 4875 + }, + { + "epoch": 0.13986013986013987, + "grad_norm": 18.13102920527004, + "learning_rate": 9.687019022636355e-07, + "loss": 0.4830134391784668, + "step": 4880 + }, + { + "epoch": 0.14000343918376706, + "grad_norm": 43.55086833733772, + "learning_rate": 9.686210391260134e-07, + "loss": 0.4730729579925537, + "step": 4885 + }, + { + "epoch": 0.14014673850739426, + "grad_norm": 26.81813941043641, + "learning_rate": 9.68540075046255e-07, + "loss": 0.49958410263061526, + "step": 4890 + }, + { + "epoch": 0.14029003783102142, + "grad_norm": 22.589857081069233, + "learning_rate": 9.684590100417997e-07, + "loss": 0.4465932846069336, + "step": 4895 + }, + { + "epoch": 0.14043333715464862, + "grad_norm": 19.448253724793997, + "learning_rate": 9.683778441301098e-07, + "loss": 0.4670268058776855, + "step": 4900 + }, + { + "epoch": 0.1405766364782758, + "grad_norm": 19.974158789477602, + "learning_rate": 9.682965773286684e-07, + "loss": 0.4971534252166748, + "step": 4905 + }, + { + "epoch": 0.140719935801903, + "grad_norm": 24.12390201010807, + "learning_rate": 9.682152096549802e-07, + "loss": 0.49178924560546877, + "step": 4910 + }, + { + "epoch": 0.1408632351255302, + "grad_norm": 18.12974051202282, + "learning_rate": 9.681337411265725e-07, + "loss": 0.4720099449157715, + "step": 4915 + }, + { + "epoch": 0.1410065344491574, + "grad_norm": 17.261108335682703, + "learning_rate": 9.680521717609938e-07, + "loss": 0.48800973892211913, + "step": 4920 + }, + { + "epoch": 0.1411498337727846, + "grad_norm": 69.90131776359225, + "learning_rate": 9.679705015758138e-07, + "loss": 0.5038124084472656, + "step": 4925 + }, + { + "epoch": 0.14129313309641178, + "grad_norm": 91.2047250078418, + "learning_rate": 9.678887305886249e-07, + "loss": 0.4877742290496826, + "step": 4930 + }, + { + "epoch": 0.14143643242003898, + "grad_norm": 13.370802634441706, + "learning_rate": 9.678068588170407e-07, + "loss": 0.5111656188964844, + "step": 4935 + }, + { + "epoch": 0.14157973174366617, + "grad_norm": 15.251368548010506, + "learning_rate": 9.677248862786968e-07, + "loss": 0.5088668823242187, + "step": 4940 + }, + { + "epoch": 0.14172303106729336, + "grad_norm": 20.733203083105845, + "learning_rate": 9.676428129912498e-07, + "loss": 0.49605369567871094, + "step": 4945 + }, + { + "epoch": 0.14186633039092056, + "grad_norm": 41.61818611361959, + "learning_rate": 9.67560638972379e-07, + "loss": 0.492279577255249, + "step": 4950 + }, + { + "epoch": 0.14200962971454775, + "grad_norm": 21.94298444153533, + "learning_rate": 9.674783642397844e-07, + "loss": 0.460846996307373, + "step": 4955 + }, + { + "epoch": 0.14215292903817495, + "grad_norm": 67.13038930718784, + "learning_rate": 9.673959888111885e-07, + "loss": 0.4584623336791992, + "step": 4960 + }, + { + "epoch": 0.14229622836180214, + "grad_norm": 25.954857234671625, + "learning_rate": 9.673135127043351e-07, + "loss": 0.5130414009094239, + "step": 4965 + }, + { + "epoch": 0.14243952768542933, + "grad_norm": 20.484295570330747, + "learning_rate": 9.672309359369897e-07, + "loss": 0.5058229923248291, + "step": 4970 + }, + { + "epoch": 0.14258282700905653, + "grad_norm": 24.089946248662102, + "learning_rate": 9.671482585269398e-07, + "loss": 0.501746940612793, + "step": 4975 + }, + { + "epoch": 0.14272612633268372, + "grad_norm": 36.28054762864382, + "learning_rate": 9.670654804919937e-07, + "loss": 0.4628440856933594, + "step": 4980 + }, + { + "epoch": 0.1428694256563109, + "grad_norm": 16.531567926061463, + "learning_rate": 9.669826018499829e-07, + "loss": 0.48522610664367677, + "step": 4985 + }, + { + "epoch": 0.14301272497993808, + "grad_norm": 51.69515514419876, + "learning_rate": 9.66899622618759e-07, + "loss": 0.5246840953826905, + "step": 4990 + }, + { + "epoch": 0.14315602430356528, + "grad_norm": 17.550266318759967, + "learning_rate": 9.66816542816196e-07, + "loss": 0.4782232761383057, + "step": 4995 + }, + { + "epoch": 0.14329932362719247, + "grad_norm": 16.73222839997114, + "learning_rate": 9.667333624601897e-07, + "loss": 0.5041857719421386, + "step": 5000 + }, + { + "epoch": 0.14344262295081966, + "grad_norm": 21.93567529244785, + "learning_rate": 9.666500815686571e-07, + "loss": 0.5015527725219726, + "step": 5005 + }, + { + "epoch": 0.14358592227444686, + "grad_norm": 22.814986804702045, + "learning_rate": 9.665667001595375e-07, + "loss": 0.4759490966796875, + "step": 5010 + }, + { + "epoch": 0.14372922159807405, + "grad_norm": 32.133567868172655, + "learning_rate": 9.66483218250791e-07, + "loss": 0.46779403686523435, + "step": 5015 + }, + { + "epoch": 0.14387252092170125, + "grad_norm": 21.728389431781828, + "learning_rate": 9.663996358604002e-07, + "loss": 0.5280585765838623, + "step": 5020 + }, + { + "epoch": 0.14401582024532844, + "grad_norm": 19.566837163731385, + "learning_rate": 9.663159530063688e-07, + "loss": 0.4742094039916992, + "step": 5025 + }, + { + "epoch": 0.14415911956895563, + "grad_norm": 50.85455684267282, + "learning_rate": 9.662321697067222e-07, + "loss": 0.4777994632720947, + "step": 5030 + }, + { + "epoch": 0.14430241889258283, + "grad_norm": 31.36700252809073, + "learning_rate": 9.661482859795077e-07, + "loss": 0.5096506118774414, + "step": 5035 + }, + { + "epoch": 0.14444571821621002, + "grad_norm": 26.124847639304473, + "learning_rate": 9.66064301842794e-07, + "loss": 0.4866472244262695, + "step": 5040 + }, + { + "epoch": 0.14458901753983722, + "grad_norm": 30.37528838776925, + "learning_rate": 9.659802173146713e-07, + "loss": 0.504782772064209, + "step": 5045 + }, + { + "epoch": 0.1447323168634644, + "grad_norm": 15.047415672417811, + "learning_rate": 9.65896032413252e-07, + "loss": 0.5105010986328125, + "step": 5050 + }, + { + "epoch": 0.1448756161870916, + "grad_norm": 21.06173830165819, + "learning_rate": 9.658117471566696e-07, + "loss": 0.49747819900512696, + "step": 5055 + }, + { + "epoch": 0.1450189155107188, + "grad_norm": 27.70902055825546, + "learning_rate": 9.65727361563079e-07, + "loss": 0.47939023971557615, + "step": 5060 + }, + { + "epoch": 0.145162214834346, + "grad_norm": 25.288884317790615, + "learning_rate": 9.656428756506576e-07, + "loss": 0.4909358978271484, + "step": 5065 + }, + { + "epoch": 0.1453055141579732, + "grad_norm": 14.569348081425426, + "learning_rate": 9.655582894376036e-07, + "loss": 0.46135830879211426, + "step": 5070 + }, + { + "epoch": 0.14544881348160035, + "grad_norm": 26.81074598761814, + "learning_rate": 9.65473602942137e-07, + "loss": 0.5287693977355957, + "step": 5075 + }, + { + "epoch": 0.14559211280522755, + "grad_norm": 25.507781242490278, + "learning_rate": 9.653888161824996e-07, + "loss": 0.45789284706115724, + "step": 5080 + }, + { + "epoch": 0.14573541212885474, + "grad_norm": 32.84338737661101, + "learning_rate": 9.653039291769548e-07, + "loss": 0.5289116859436035, + "step": 5085 + }, + { + "epoch": 0.14587871145248194, + "grad_norm": 18.629436879609113, + "learning_rate": 9.652189419437873e-07, + "loss": 0.5244021415710449, + "step": 5090 + }, + { + "epoch": 0.14602201077610913, + "grad_norm": 29.55310534904773, + "learning_rate": 9.651338545013034e-07, + "loss": 0.46414766311645506, + "step": 5095 + }, + { + "epoch": 0.14616531009973632, + "grad_norm": 14.016915505540526, + "learning_rate": 9.650486668678316e-07, + "loss": 0.4474936485290527, + "step": 5100 + }, + { + "epoch": 0.14616531009973632, + "eval_bfov_iou": 0.7851945589829961, + "eval_bfov_iou@0.1": 0.976, + "eval_bfov_iou@0.25": 0.976, + "eval_bfov_iou@0.5": 0.968, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5611428571428572, + "eval_exact_match": 0.3205, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 392.9348, + "eval_samples_per_second": 5.09, + "eval_steps_per_second": 0.16, + "eval_task_acc_absolute_direction_mc": 0.832, + "eval_task_acc_camera_rotation_transform_mc": 0.4, + "eval_task_acc_object_conditioned_reorientation_mc": 0.404, + "eval_task_acc_observer_distance_choice": 0.608, + "eval_task_acc_relative_3d_position_mc": 0.508, + "eval_task_acc_relative_direction_mc": 0.492, + "eval_task_acc_seam_continuity_mc": 0.684, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.976, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.968, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7851945589829961, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 5100 + }, + { + "epoch": 0.14630860942336352, + "grad_norm": 13.601173501200627, + "learning_rate": 9.64963379061721e-07, + "loss": 0.5324724197387696, + "step": 5105 + }, + { + "epoch": 0.1464519087469907, + "grad_norm": 16.550071679457016, + "learning_rate": 9.648779911013434e-07, + "loss": 0.4728814125061035, + "step": 5110 + }, + { + "epoch": 0.1465952080706179, + "grad_norm": 53.77223906679079, + "learning_rate": 9.647925030050912e-07, + "loss": 0.4594442367553711, + "step": 5115 + }, + { + "epoch": 0.1467385073942451, + "grad_norm": 96.24563668379298, + "learning_rate": 9.647069147913786e-07, + "loss": 0.5005455017089844, + "step": 5120 + }, + { + "epoch": 0.1468818067178723, + "grad_norm": 23.213061948450942, + "learning_rate": 9.646212264786418e-07, + "loss": 0.5215416431427002, + "step": 5125 + }, + { + "epoch": 0.1470251060414995, + "grad_norm": 14.467893463577337, + "learning_rate": 9.645354380853384e-07, + "loss": 0.4891940116882324, + "step": 5130 + }, + { + "epoch": 0.14716840536512668, + "grad_norm": 31.95740742264265, + "learning_rate": 9.64449549629947e-07, + "loss": 0.4742134094238281, + "step": 5135 + }, + { + "epoch": 0.14731170468875388, + "grad_norm": 26.100259692197252, + "learning_rate": 9.643635611309685e-07, + "loss": 0.4917646884918213, + "step": 5140 + }, + { + "epoch": 0.14745500401238107, + "grad_norm": 23.56713514074692, + "learning_rate": 9.64277472606925e-07, + "loss": 0.511807632446289, + "step": 5145 + }, + { + "epoch": 0.14759830333600826, + "grad_norm": 20.480226570477413, + "learning_rate": 9.6419128407636e-07, + "loss": 0.48923287391662595, + "step": 5150 + }, + { + "epoch": 0.14774160265963546, + "grad_norm": 19.09903926971639, + "learning_rate": 9.64104995557839e-07, + "loss": 0.4906296730041504, + "step": 5155 + }, + { + "epoch": 0.14788490198326265, + "grad_norm": 17.095390628135934, + "learning_rate": 9.640186070699485e-07, + "loss": 0.5110513687133789, + "step": 5160 + }, + { + "epoch": 0.14802820130688985, + "grad_norm": 17.660553570821456, + "learning_rate": 9.63932118631297e-07, + "loss": 0.477280330657959, + "step": 5165 + }, + { + "epoch": 0.148171500630517, + "grad_norm": 27.248970172882153, + "learning_rate": 9.638455302605143e-07, + "loss": 0.4826923370361328, + "step": 5170 + }, + { + "epoch": 0.1483147999541442, + "grad_norm": 15.53949096172831, + "learning_rate": 9.637588419762515e-07, + "loss": 0.498883581161499, + "step": 5175 + }, + { + "epoch": 0.1484580992777714, + "grad_norm": 10.931152103023537, + "learning_rate": 9.636720537971818e-07, + "loss": 0.4918032169342041, + "step": 5180 + }, + { + "epoch": 0.1486013986013986, + "grad_norm": 19.626880744877816, + "learning_rate": 9.635851657419994e-07, + "loss": 0.48644218444824217, + "step": 5185 + }, + { + "epoch": 0.1487446979250258, + "grad_norm": 25.632867576478155, + "learning_rate": 9.634981778294204e-07, + "loss": 0.4950981616973877, + "step": 5190 + }, + { + "epoch": 0.14888799724865298, + "grad_norm": 16.848110865607328, + "learning_rate": 9.63411090078182e-07, + "loss": 0.460736083984375, + "step": 5195 + }, + { + "epoch": 0.14903129657228018, + "grad_norm": 18.690134802733507, + "learning_rate": 9.63323902507043e-07, + "loss": 0.4897314071655273, + "step": 5200 + }, + { + "epoch": 0.14917459589590737, + "grad_norm": 11.987830424751005, + "learning_rate": 9.632366151347842e-07, + "loss": 0.5023289203643799, + "step": 5205 + }, + { + "epoch": 0.14931789521953456, + "grad_norm": 19.284434045916946, + "learning_rate": 9.631492279802072e-07, + "loss": 0.5040738105773925, + "step": 5210 + }, + { + "epoch": 0.14946119454316176, + "grad_norm": 43.99592617254368, + "learning_rate": 9.630617410621358e-07, + "loss": 0.4754795551300049, + "step": 5215 + }, + { + "epoch": 0.14960449386678895, + "grad_norm": 16.510299672451186, + "learning_rate": 9.629741543994143e-07, + "loss": 0.4774524211883545, + "step": 5220 + }, + { + "epoch": 0.14974779319041615, + "grad_norm": 14.285813534132442, + "learning_rate": 9.628864680109095e-07, + "loss": 0.48259744644165037, + "step": 5225 + }, + { + "epoch": 0.14989109251404334, + "grad_norm": 13.81246499505297, + "learning_rate": 9.627986819155093e-07, + "loss": 0.46251440048217773, + "step": 5230 + }, + { + "epoch": 0.15003439183767053, + "grad_norm": 55.79970022219391, + "learning_rate": 9.627107961321228e-07, + "loss": 0.4420746326446533, + "step": 5235 + }, + { + "epoch": 0.15017769116129773, + "grad_norm": 13.609065086173857, + "learning_rate": 9.626228106796809e-07, + "loss": 0.48780040740966796, + "step": 5240 + }, + { + "epoch": 0.15032099048492492, + "grad_norm": 17.26487399315407, + "learning_rate": 9.62534725577136e-07, + "loss": 0.48295068740844727, + "step": 5245 + }, + { + "epoch": 0.15046428980855212, + "grad_norm": 17.034034300299947, + "learning_rate": 9.624465408434618e-07, + "loss": 0.49605159759521483, + "step": 5250 + }, + { + "epoch": 0.1506075891321793, + "grad_norm": 19.371269035241212, + "learning_rate": 9.623582564976537e-07, + "loss": 0.4725840091705322, + "step": 5255 + }, + { + "epoch": 0.15075088845580648, + "grad_norm": 18.99691095518913, + "learning_rate": 9.62269872558728e-07, + "loss": 0.5044740676879883, + "step": 5260 + }, + { + "epoch": 0.15089418777943367, + "grad_norm": 36.74340215161051, + "learning_rate": 9.621813890457229e-07, + "loss": 0.5094461441040039, + "step": 5265 + }, + { + "epoch": 0.15103748710306086, + "grad_norm": 15.955348035099249, + "learning_rate": 9.62092805977698e-07, + "loss": 0.47185344696044923, + "step": 5270 + }, + { + "epoch": 0.15118078642668806, + "grad_norm": 34.19966516695217, + "learning_rate": 9.620041233737343e-07, + "loss": 0.48040108680725097, + "step": 5275 + }, + { + "epoch": 0.15132408575031525, + "grad_norm": 17.570422066330593, + "learning_rate": 9.619153412529345e-07, + "loss": 0.49138031005859373, + "step": 5280 + }, + { + "epoch": 0.15146738507394245, + "grad_norm": 20.772771045764244, + "learning_rate": 9.618264596344224e-07, + "loss": 0.5231310844421386, + "step": 5285 + }, + { + "epoch": 0.15161068439756964, + "grad_norm": 26.89916316877698, + "learning_rate": 9.61737478537343e-07, + "loss": 0.499554443359375, + "step": 5290 + }, + { + "epoch": 0.15175398372119683, + "grad_norm": 25.334623914687715, + "learning_rate": 9.616483979808632e-07, + "loss": 0.49796133041381835, + "step": 5295 + }, + { + "epoch": 0.15189728304482403, + "grad_norm": 13.929944718748862, + "learning_rate": 9.615592179841714e-07, + "loss": 0.4582359313964844, + "step": 5300 + }, + { + "epoch": 0.15204058236845122, + "grad_norm": 21.016070039630645, + "learning_rate": 9.61469938566477e-07, + "loss": 0.4912844181060791, + "step": 5305 + }, + { + "epoch": 0.15218388169207842, + "grad_norm": 14.543428439528379, + "learning_rate": 9.61380559747011e-07, + "loss": 0.514399528503418, + "step": 5310 + }, + { + "epoch": 0.1523271810157056, + "grad_norm": 17.037967263705664, + "learning_rate": 9.61291081545026e-07, + "loss": 0.5124261379241943, + "step": 5315 + }, + { + "epoch": 0.1524704803393328, + "grad_norm": 18.34599549517184, + "learning_rate": 9.612015039797957e-07, + "loss": 0.5273198127746582, + "step": 5320 + }, + { + "epoch": 0.15261377966296, + "grad_norm": 28.89087409219422, + "learning_rate": 9.61111827070615e-07, + "loss": 0.5110832691192627, + "step": 5325 + }, + { + "epoch": 0.1527570789865872, + "grad_norm": 25.773328750619207, + "learning_rate": 9.610220508368011e-07, + "loss": 0.5138680934906006, + "step": 5330 + }, + { + "epoch": 0.15290037831021439, + "grad_norm": 15.900712582908778, + "learning_rate": 9.60932175297692e-07, + "loss": 0.4864922046661377, + "step": 5335 + }, + { + "epoch": 0.15304367763384158, + "grad_norm": 28.55155655707502, + "learning_rate": 9.608422004726467e-07, + "loss": 0.4851415157318115, + "step": 5340 + }, + { + "epoch": 0.15318697695746877, + "grad_norm": 26.093107954433627, + "learning_rate": 9.60752126381046e-07, + "loss": 0.5044075012207031, + "step": 5345 + }, + { + "epoch": 0.15333027628109594, + "grad_norm": 16.739523785041804, + "learning_rate": 9.606619530422925e-07, + "loss": 0.44365510940551756, + "step": 5350 + }, + { + "epoch": 0.15347357560472313, + "grad_norm": 17.693817289602435, + "learning_rate": 9.605716804758095e-07, + "loss": 0.4771699905395508, + "step": 5355 + }, + { + "epoch": 0.15361687492835033, + "grad_norm": 23.458193116654304, + "learning_rate": 9.604813087010419e-07, + "loss": 0.5289233207702637, + "step": 5360 + }, + { + "epoch": 0.15376017425197752, + "grad_norm": 17.904608689661973, + "learning_rate": 9.603908377374562e-07, + "loss": 0.496568489074707, + "step": 5365 + }, + { + "epoch": 0.15390347357560472, + "grad_norm": 14.90862887985881, + "learning_rate": 9.603002676045396e-07, + "loss": 0.47331809997558594, + "step": 5370 + }, + { + "epoch": 0.1540467728992319, + "grad_norm": 18.97365214586352, + "learning_rate": 9.602095983218018e-07, + "loss": 0.5154491901397705, + "step": 5375 + }, + { + "epoch": 0.1541900722228591, + "grad_norm": 29.30477311359636, + "learning_rate": 9.60118829908773e-07, + "loss": 0.467680549621582, + "step": 5380 + }, + { + "epoch": 0.1543333715464863, + "grad_norm": 12.734499440510591, + "learning_rate": 9.600279623850046e-07, + "loss": 0.48137311935424804, + "step": 5385 + }, + { + "epoch": 0.1544766708701135, + "grad_norm": 24.104678727555626, + "learning_rate": 9.599369957700698e-07, + "loss": 0.5029919624328614, + "step": 5390 + }, + { + "epoch": 0.15461997019374069, + "grad_norm": 38.24642226534957, + "learning_rate": 9.59845930083563e-07, + "loss": 0.5086793899536133, + "step": 5395 + }, + { + "epoch": 0.15476326951736788, + "grad_norm": 21.981928723529904, + "learning_rate": 9.597547653451005e-07, + "loss": 0.48301944732666013, + "step": 5400 + }, + { + "epoch": 0.15476326951736788, + "eval_bfov_iou": 0.7104059040677452, + "eval_bfov_iou@0.1": 0.904, + "eval_bfov_iou@0.25": 0.884, + "eval_bfov_iou@0.5": 0.876, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5434285714285715, + "eval_exact_match": 0.383, + "eval_invalid_choice_rate": 0.0005714285714285715, + "eval_runtime": 416.8254, + "eval_samples_per_second": 4.798, + "eval_steps_per_second": 0.151, + "eval_task_acc_absolute_direction_mc": 0.824, + "eval_task_acc_camera_rotation_transform_mc": 0.308, + "eval_task_acc_object_conditioned_reorientation_mc": 0.392, + "eval_task_acc_observer_distance_choice": 0.612, + "eval_task_acc_relative_3d_position_mc": 0.56, + "eval_task_acc_relative_direction_mc": 0.44, + "eval_task_acc_seam_continuity_mc": 0.668, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.904, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.884, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.876, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7104059040677452, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 5400 + }, + { + "epoch": 0.15490656884099507, + "grad_norm": 12.76988398867348, + "learning_rate": 9.596635015743188e-07, + "loss": 0.5534495353698731, + "step": 5405 + }, + { + "epoch": 0.15504986816462227, + "grad_norm": 13.262622471420258, + "learning_rate": 9.595721387908766e-07, + "loss": 0.5246593475341796, + "step": 5410 + }, + { + "epoch": 0.15519316748824946, + "grad_norm": 13.796427410956166, + "learning_rate": 9.594806770144538e-07, + "loss": 0.4665219306945801, + "step": 5415 + }, + { + "epoch": 0.15533646681187666, + "grad_norm": 14.924792428709248, + "learning_rate": 9.593891162647511e-07, + "loss": 0.4750338554382324, + "step": 5420 + }, + { + "epoch": 0.15547976613550385, + "grad_norm": 21.715100760161576, + "learning_rate": 9.592974565614913e-07, + "loss": 0.501518726348877, + "step": 5425 + }, + { + "epoch": 0.15562306545913104, + "grad_norm": 14.01216338776038, + "learning_rate": 9.592056979244178e-07, + "loss": 0.5263134479522705, + "step": 5430 + }, + { + "epoch": 0.15576636478275824, + "grad_norm": 27.67903042628267, + "learning_rate": 9.59113840373296e-07, + "loss": 0.4878545761108398, + "step": 5435 + }, + { + "epoch": 0.15590966410638543, + "grad_norm": 12.74487427300849, + "learning_rate": 9.590218839279118e-07, + "loss": 0.46703414916992186, + "step": 5440 + }, + { + "epoch": 0.1560529634300126, + "grad_norm": 31.35558365926776, + "learning_rate": 9.589298286080733e-07, + "loss": 0.5329798221588135, + "step": 5445 + }, + { + "epoch": 0.1561962627536398, + "grad_norm": 13.484834821556111, + "learning_rate": 9.588376744336092e-07, + "loss": 0.455476713180542, + "step": 5450 + }, + { + "epoch": 0.15633956207726699, + "grad_norm": 21.733935448388408, + "learning_rate": 9.587454214243698e-07, + "loss": 0.5100439071655274, + "step": 5455 + }, + { + "epoch": 0.15648286140089418, + "grad_norm": 13.364827157821827, + "learning_rate": 9.586530696002265e-07, + "loss": 0.4834928512573242, + "step": 5460 + }, + { + "epoch": 0.15662616072452137, + "grad_norm": 10.655692318546178, + "learning_rate": 9.585606189810724e-07, + "loss": 0.4804999351501465, + "step": 5465 + }, + { + "epoch": 0.15676946004814857, + "grad_norm": 12.56288319658444, + "learning_rate": 9.584680695868212e-07, + "loss": 0.48285541534423826, + "step": 5470 + }, + { + "epoch": 0.15691275937177576, + "grad_norm": 29.072807162456467, + "learning_rate": 9.583754214374088e-07, + "loss": 0.5558177947998046, + "step": 5475 + }, + { + "epoch": 0.15705605869540296, + "grad_norm": 35.15302342662568, + "learning_rate": 9.582826745527913e-07, + "loss": 0.5123523712158203, + "step": 5480 + }, + { + "epoch": 0.15719935801903015, + "grad_norm": 14.087782180418651, + "learning_rate": 9.581898289529467e-07, + "loss": 0.45984177589416503, + "step": 5485 + }, + { + "epoch": 0.15734265734265734, + "grad_norm": 17.24282013188445, + "learning_rate": 9.580968846578745e-07, + "loss": 0.4955912590026855, + "step": 5490 + }, + { + "epoch": 0.15748595666628454, + "grad_norm": 14.850658993535909, + "learning_rate": 9.58003841687595e-07, + "loss": 0.4514634132385254, + "step": 5495 + }, + { + "epoch": 0.15762925598991173, + "grad_norm": 15.680804448274522, + "learning_rate": 9.579107000621496e-07, + "loss": 0.5073150157928467, + "step": 5500 + }, + { + "epoch": 0.15777255531353893, + "grad_norm": 16.405257733220655, + "learning_rate": 9.578174598016016e-07, + "loss": 0.5232337474822998, + "step": 5505 + }, + { + "epoch": 0.15791585463716612, + "grad_norm": 22.742283453619226, + "learning_rate": 9.57724120926035e-07, + "loss": 0.43845357894897463, + "step": 5510 + }, + { + "epoch": 0.1580591539607933, + "grad_norm": 23.25047688279613, + "learning_rate": 9.576306834555555e-07, + "loss": 0.49999251365661623, + "step": 5515 + }, + { + "epoch": 0.1582024532844205, + "grad_norm": 25.695166597712074, + "learning_rate": 9.575371474102893e-07, + "loss": 0.4657792091369629, + "step": 5520 + }, + { + "epoch": 0.1583457526080477, + "grad_norm": 12.249246383774553, + "learning_rate": 9.574435128103846e-07, + "loss": 0.47530083656311034, + "step": 5525 + }, + { + "epoch": 0.1584890519316749, + "grad_norm": 28.571408059623504, + "learning_rate": 9.573497796760104e-07, + "loss": 0.49605870246887207, + "step": 5530 + }, + { + "epoch": 0.15863235125530206, + "grad_norm": 57.41333937093257, + "learning_rate": 9.572559480273573e-07, + "loss": 0.4584352493286133, + "step": 5535 + }, + { + "epoch": 0.15877565057892926, + "grad_norm": 15.881715549939267, + "learning_rate": 9.571620178846364e-07, + "loss": 0.5104794502258301, + "step": 5540 + }, + { + "epoch": 0.15891894990255645, + "grad_norm": 16.554325290430533, + "learning_rate": 9.570679892680808e-07, + "loss": 0.4804971694946289, + "step": 5545 + }, + { + "epoch": 0.15906224922618364, + "grad_norm": 12.06856659265275, + "learning_rate": 9.569738621979446e-07, + "loss": 0.4986520290374756, + "step": 5550 + }, + { + "epoch": 0.15920554854981084, + "grad_norm": 24.794153712933227, + "learning_rate": 9.56879636694503e-07, + "loss": 0.5028439998626709, + "step": 5555 + }, + { + "epoch": 0.15934884787343803, + "grad_norm": 18.748794485596864, + "learning_rate": 9.56785312778052e-07, + "loss": 0.5113292694091797, + "step": 5560 + }, + { + "epoch": 0.15949214719706523, + "grad_norm": 25.41005045886998, + "learning_rate": 9.566908904689097e-07, + "loss": 0.48024682998657225, + "step": 5565 + }, + { + "epoch": 0.15963544652069242, + "grad_norm": 45.95110402193613, + "learning_rate": 9.565963697874145e-07, + "loss": 0.48197345733642577, + "step": 5570 + }, + { + "epoch": 0.15977874584431961, + "grad_norm": 16.014660624383435, + "learning_rate": 9.565017507539267e-07, + "loss": 0.4679136276245117, + "step": 5575 + }, + { + "epoch": 0.1599220451679468, + "grad_norm": 25.65032770924003, + "learning_rate": 9.564070333888271e-07, + "loss": 0.4399147033691406, + "step": 5580 + }, + { + "epoch": 0.160065344491574, + "grad_norm": 22.171981327391798, + "learning_rate": 9.563122177125186e-07, + "loss": 0.5000683307647705, + "step": 5585 + }, + { + "epoch": 0.1602086438152012, + "grad_norm": 31.010784099258064, + "learning_rate": 9.562173037454244e-07, + "loss": 0.5045644760131835, + "step": 5590 + }, + { + "epoch": 0.1603519431388284, + "grad_norm": 14.062634222898708, + "learning_rate": 9.56122291507989e-07, + "loss": 0.44838724136352537, + "step": 5595 + }, + { + "epoch": 0.16049524246245558, + "grad_norm": 12.094406755561954, + "learning_rate": 9.560271810206789e-07, + "loss": 0.488132381439209, + "step": 5600 + }, + { + "epoch": 0.16063854178608278, + "grad_norm": 24.479533853542026, + "learning_rate": 9.559319723039804e-07, + "loss": 0.4845831871032715, + "step": 5605 + }, + { + "epoch": 0.16078184110970997, + "grad_norm": 52.74759802052609, + "learning_rate": 9.558366653784022e-07, + "loss": 0.46910643577575684, + "step": 5610 + }, + { + "epoch": 0.16092514043333717, + "grad_norm": 36.0198870798656, + "learning_rate": 9.557412602644735e-07, + "loss": 0.5071182727813721, + "step": 5615 + }, + { + "epoch": 0.16106843975696436, + "grad_norm": 19.990368555781078, + "learning_rate": 9.556457569827447e-07, + "loss": 0.4478751659393311, + "step": 5620 + }, + { + "epoch": 0.16121173908059153, + "grad_norm": 17.81020756872046, + "learning_rate": 9.555501555537877e-07, + "loss": 0.4862050533294678, + "step": 5625 + }, + { + "epoch": 0.16135503840421872, + "grad_norm": 23.463206640648806, + "learning_rate": 9.55454455998195e-07, + "loss": 0.4984159469604492, + "step": 5630 + }, + { + "epoch": 0.16149833772784591, + "grad_norm": 48.11445726235823, + "learning_rate": 9.553586583365806e-07, + "loss": 0.47490243911743163, + "step": 5635 + }, + { + "epoch": 0.1616416370514731, + "grad_norm": 18.04984437703025, + "learning_rate": 9.552627625895796e-07, + "loss": 0.4684635639190674, + "step": 5640 + }, + { + "epoch": 0.1617849363751003, + "grad_norm": 12.0985728071987, + "learning_rate": 9.551667687778483e-07, + "loss": 0.4722273826599121, + "step": 5645 + }, + { + "epoch": 0.1619282356987275, + "grad_norm": 58.01689277139024, + "learning_rate": 9.550706769220639e-07, + "loss": 0.4726852893829346, + "step": 5650 + }, + { + "epoch": 0.1620715350223547, + "grad_norm": 88.67745683314425, + "learning_rate": 9.549744870429245e-07, + "loss": 0.5191467761993408, + "step": 5655 + }, + { + "epoch": 0.16221483434598188, + "grad_norm": 11.514655926714983, + "learning_rate": 9.5487819916115e-07, + "loss": 0.48065791130065916, + "step": 5660 + }, + { + "epoch": 0.16235813366960908, + "grad_norm": 22.411933147161346, + "learning_rate": 9.547818132974813e-07, + "loss": 0.47487220764160154, + "step": 5665 + }, + { + "epoch": 0.16250143299323627, + "grad_norm": 15.178589963306745, + "learning_rate": 9.546853294726797e-07, + "loss": 0.44351515769958494, + "step": 5670 + }, + { + "epoch": 0.16264473231686347, + "grad_norm": 22.640570098551084, + "learning_rate": 9.545887477075282e-07, + "loss": 0.49120235443115234, + "step": 5675 + }, + { + "epoch": 0.16278803164049066, + "grad_norm": 20.82045873280111, + "learning_rate": 9.544920680228309e-07, + "loss": 0.4763439178466797, + "step": 5680 + }, + { + "epoch": 0.16293133096411785, + "grad_norm": 23.006919224121656, + "learning_rate": 9.543952904394123e-07, + "loss": 0.5086928367614746, + "step": 5685 + }, + { + "epoch": 0.16307463028774505, + "grad_norm": 28.394669065977695, + "learning_rate": 9.542984149781192e-07, + "loss": 0.4763385772705078, + "step": 5690 + }, + { + "epoch": 0.16321792961137224, + "grad_norm": 18.053985547594337, + "learning_rate": 9.542014416598185e-07, + "loss": 0.48696246147155764, + "step": 5695 + }, + { + "epoch": 0.16336122893499944, + "grad_norm": 19.790356363127994, + "learning_rate": 9.541043705053986e-07, + "loss": 0.45038762092590334, + "step": 5700 + }, + { + "epoch": 0.16336122893499944, + "eval_bfov_iou": 0.7425043616119742, + "eval_bfov_iou@0.1": 0.956, + "eval_bfov_iou@0.25": 0.956, + "eval_bfov_iou@0.5": 0.944, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5651428571428572, + "eval_exact_match": 0.3745, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 509.7805, + "eval_samples_per_second": 3.923, + "eval_steps_per_second": 0.124, + "eval_task_acc_absolute_direction_mc": 0.796, + "eval_task_acc_camera_rotation_transform_mc": 0.308, + "eval_task_acc_object_conditioned_reorientation_mc": 0.432, + "eval_task_acc_observer_distance_choice": 0.624, + "eval_task_acc_relative_3d_position_mc": 0.552, + "eval_task_acc_relative_direction_mc": 0.536, + "eval_task_acc_seam_continuity_mc": 0.708, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.956, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.956, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.944, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7425043616119742, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 5700 + }, + { + "epoch": 0.16350452825862663, + "grad_norm": 16.263405145944677, + "learning_rate": 9.54007201535769e-07, + "loss": 0.5190417289733886, + "step": 5705 + }, + { + "epoch": 0.16364782758225382, + "grad_norm": 13.975236220710965, + "learning_rate": 9.539099347718595e-07, + "loss": 0.5151944160461426, + "step": 5710 + }, + { + "epoch": 0.163791126905881, + "grad_norm": 16.801108018904404, + "learning_rate": 9.538125702346224e-07, + "loss": 0.4688068389892578, + "step": 5715 + }, + { + "epoch": 0.16393442622950818, + "grad_norm": 33.01508793419409, + "learning_rate": 9.5371510794503e-07, + "loss": 0.458497142791748, + "step": 5720 + }, + { + "epoch": 0.16407772555313538, + "grad_norm": 12.961795096096493, + "learning_rate": 9.536175479240753e-07, + "loss": 0.5104208946228027, + "step": 5725 + }, + { + "epoch": 0.16422102487676257, + "grad_norm": 20.71867873453571, + "learning_rate": 9.535198901927739e-07, + "loss": 0.5000085353851318, + "step": 5730 + }, + { + "epoch": 0.16436432420038977, + "grad_norm": 24.441239776343735, + "learning_rate": 9.53422134772161e-07, + "loss": 0.46926207542419435, + "step": 5735 + }, + { + "epoch": 0.16450762352401696, + "grad_norm": 22.31641913328923, + "learning_rate": 9.533242816832936e-07, + "loss": 0.47144064903259275, + "step": 5740 + }, + { + "epoch": 0.16465092284764415, + "grad_norm": 22.5228963306184, + "learning_rate": 9.532263309472493e-07, + "loss": 0.49860758781433107, + "step": 5745 + }, + { + "epoch": 0.16479422217127135, + "grad_norm": 17.110922057424812, + "learning_rate": 9.53128282585127e-07, + "loss": 0.46269803047180175, + "step": 5750 + }, + { + "epoch": 0.16493752149489854, + "grad_norm": 11.790943162684597, + "learning_rate": 9.530301366180467e-07, + "loss": 0.5041066169738769, + "step": 5755 + }, + { + "epoch": 0.16508082081852574, + "grad_norm": 24.226081644823807, + "learning_rate": 9.52931893067149e-07, + "loss": 0.4682796478271484, + "step": 5760 + }, + { + "epoch": 0.16522412014215293, + "grad_norm": 16.54386098146435, + "learning_rate": 9.52833551953596e-07, + "loss": 0.529063606262207, + "step": 5765 + }, + { + "epoch": 0.16536741946578012, + "grad_norm": 12.418876725806182, + "learning_rate": 9.527351132985706e-07, + "loss": 0.4878284454345703, + "step": 5770 + }, + { + "epoch": 0.16551071878940732, + "grad_norm": 19.263748264919602, + "learning_rate": 9.526365771232768e-07, + "loss": 0.4557389259338379, + "step": 5775 + }, + { + "epoch": 0.1656540181130345, + "grad_norm": 14.788748238364475, + "learning_rate": 9.525379434489393e-07, + "loss": 0.4800085544586182, + "step": 5780 + }, + { + "epoch": 0.1657973174366617, + "grad_norm": 12.849390509848979, + "learning_rate": 9.524392122968044e-07, + "loss": 0.4816844940185547, + "step": 5785 + }, + { + "epoch": 0.1659406167602889, + "grad_norm": 14.743343852294307, + "learning_rate": 9.523403836881386e-07, + "loss": 0.4785021781921387, + "step": 5790 + }, + { + "epoch": 0.1660839160839161, + "grad_norm": 20.66543163372119, + "learning_rate": 9.522414576442302e-07, + "loss": 0.4852582931518555, + "step": 5795 + }, + { + "epoch": 0.1662272154075433, + "grad_norm": 22.241508986941827, + "learning_rate": 9.521424341863878e-07, + "loss": 0.47209701538085935, + "step": 5800 + }, + { + "epoch": 0.16637051473117048, + "grad_norm": 24.293277406393944, + "learning_rate": 9.520433133359416e-07, + "loss": 0.4853528499603271, + "step": 5805 + }, + { + "epoch": 0.16651381405479765, + "grad_norm": 16.36970001944858, + "learning_rate": 9.519440951142423e-07, + "loss": 0.49168968200683594, + "step": 5810 + }, + { + "epoch": 0.16665711337842484, + "grad_norm": 16.946504210695995, + "learning_rate": 9.518447795426619e-07, + "loss": 0.5057958602905274, + "step": 5815 + }, + { + "epoch": 0.16680041270205204, + "grad_norm": 11.963433060490969, + "learning_rate": 9.517453666425929e-07, + "loss": 0.4944276809692383, + "step": 5820 + }, + { + "epoch": 0.16694371202567923, + "grad_norm": 16.496151253536247, + "learning_rate": 9.516458564354496e-07, + "loss": 0.4931192398071289, + "step": 5825 + }, + { + "epoch": 0.16708701134930642, + "grad_norm": 24.644751802835188, + "learning_rate": 9.515462489426663e-07, + "loss": 0.46903133392333984, + "step": 5830 + }, + { + "epoch": 0.16723031067293362, + "grad_norm": 16.826032402209005, + "learning_rate": 9.514465441856989e-07, + "loss": 0.4624685287475586, + "step": 5835 + }, + { + "epoch": 0.1673736099965608, + "grad_norm": 16.480889807862354, + "learning_rate": 9.513467421860239e-07, + "loss": 0.4528830051422119, + "step": 5840 + }, + { + "epoch": 0.167516909320188, + "grad_norm": 15.671033219663027, + "learning_rate": 9.512468429651391e-07, + "loss": 0.4727164268493652, + "step": 5845 + }, + { + "epoch": 0.1676602086438152, + "grad_norm": 15.153300336014034, + "learning_rate": 9.511468465445629e-07, + "loss": 0.48502411842346194, + "step": 5850 + }, + { + "epoch": 0.1678035079674424, + "grad_norm": 17.39904631100928, + "learning_rate": 9.510467529458348e-07, + "loss": 0.5442911148071289, + "step": 5855 + }, + { + "epoch": 0.1679468072910696, + "grad_norm": 26.30572513878789, + "learning_rate": 9.509465621905153e-07, + "loss": 0.4641237735748291, + "step": 5860 + }, + { + "epoch": 0.16809010661469678, + "grad_norm": 15.18264578309046, + "learning_rate": 9.508462743001855e-07, + "loss": 0.4612721920013428, + "step": 5865 + }, + { + "epoch": 0.16823340593832398, + "grad_norm": 15.661751100318348, + "learning_rate": 9.507458892964481e-07, + "loss": 0.49169044494628905, + "step": 5870 + }, + { + "epoch": 0.16837670526195117, + "grad_norm": 57.573507945879896, + "learning_rate": 9.506454072009258e-07, + "loss": 0.4348124027252197, + "step": 5875 + }, + { + "epoch": 0.16852000458557836, + "grad_norm": 18.588644915167613, + "learning_rate": 9.50544828035263e-07, + "loss": 0.47088146209716797, + "step": 5880 + }, + { + "epoch": 0.16866330390920556, + "grad_norm": 28.999707019299723, + "learning_rate": 9.504441518211244e-07, + "loss": 0.516765546798706, + "step": 5885 + }, + { + "epoch": 0.16880660323283275, + "grad_norm": 23.331357427874934, + "learning_rate": 9.503433785801964e-07, + "loss": 0.4879454612731934, + "step": 5890 + }, + { + "epoch": 0.16894990255645995, + "grad_norm": 17.143352905522324, + "learning_rate": 9.502425083341854e-07, + "loss": 0.49801321029663087, + "step": 5895 + }, + { + "epoch": 0.1690932018800871, + "grad_norm": 13.959041649154456, + "learning_rate": 9.501415411048192e-07, + "loss": 0.4817807197570801, + "step": 5900 + }, + { + "epoch": 0.1692365012037143, + "grad_norm": 19.03583412834793, + "learning_rate": 9.500404769138464e-07, + "loss": 0.45316734313964846, + "step": 5905 + }, + { + "epoch": 0.1693798005273415, + "grad_norm": 18.381737049574866, + "learning_rate": 9.499393157830365e-07, + "loss": 0.4806058406829834, + "step": 5910 + }, + { + "epoch": 0.1695230998509687, + "grad_norm": 14.171550035020406, + "learning_rate": 9.498380577341798e-07, + "loss": 0.47402200698852537, + "step": 5915 + }, + { + "epoch": 0.1696663991745959, + "grad_norm": 18.116083023074474, + "learning_rate": 9.497367027890877e-07, + "loss": 0.4927574634552002, + "step": 5920 + }, + { + "epoch": 0.16980969849822308, + "grad_norm": 13.41644252454998, + "learning_rate": 9.496352509695922e-07, + "loss": 0.45580530166625977, + "step": 5925 + }, + { + "epoch": 0.16995299782185028, + "grad_norm": 24.56464559318852, + "learning_rate": 9.495337022975462e-07, + "loss": 0.5001698493957519, + "step": 5930 + }, + { + "epoch": 0.17009629714547747, + "grad_norm": 11.517582952228478, + "learning_rate": 9.494320567948235e-07, + "loss": 0.48135061264038087, + "step": 5935 + }, + { + "epoch": 0.17023959646910466, + "grad_norm": 15.948159047568362, + "learning_rate": 9.49330314483319e-07, + "loss": 0.4856859683990479, + "step": 5940 + }, + { + "epoch": 0.17038289579273186, + "grad_norm": 17.105555733914674, + "learning_rate": 9.492284753849482e-07, + "loss": 0.4410531997680664, + "step": 5945 + }, + { + "epoch": 0.17052619511635905, + "grad_norm": 19.106794898121972, + "learning_rate": 9.491265395216473e-07, + "loss": 0.5036467552185059, + "step": 5950 + }, + { + "epoch": 0.17066949443998625, + "grad_norm": 22.33099436714888, + "learning_rate": 9.490245069153737e-07, + "loss": 0.5074322700500489, + "step": 5955 + }, + { + "epoch": 0.17081279376361344, + "grad_norm": 13.699254204776265, + "learning_rate": 9.489223775881056e-07, + "loss": 0.4543007850646973, + "step": 5960 + }, + { + "epoch": 0.17095609308724063, + "grad_norm": 16.574555633331414, + "learning_rate": 9.488201515618416e-07, + "loss": 0.48146734237670896, + "step": 5965 + }, + { + "epoch": 0.17109939241086783, + "grad_norm": 22.699078290207854, + "learning_rate": 9.487178288586017e-07, + "loss": 0.48718767166137694, + "step": 5970 + }, + { + "epoch": 0.17124269173449502, + "grad_norm": 12.52785332185837, + "learning_rate": 9.486154095004263e-07, + "loss": 0.5087747573852539, + "step": 5975 + }, + { + "epoch": 0.17138599105812222, + "grad_norm": 11.144830437986492, + "learning_rate": 9.485128935093769e-07, + "loss": 0.4433113098144531, + "step": 5980 + }, + { + "epoch": 0.1715292903817494, + "grad_norm": 17.1383898655658, + "learning_rate": 9.484102809075356e-07, + "loss": 0.5036598682403565, + "step": 5985 + }, + { + "epoch": 0.17167258970537658, + "grad_norm": 19.1821745426877, + "learning_rate": 9.483075717170055e-07, + "loss": 0.4801191329956055, + "step": 5990 + }, + { + "epoch": 0.17181588902900377, + "grad_norm": 22.951830357337563, + "learning_rate": 9.482047659599104e-07, + "loss": 0.4650597095489502, + "step": 5995 + }, + { + "epoch": 0.17195918835263097, + "grad_norm": 12.467650310173038, + "learning_rate": 9.481018636583949e-07, + "loss": 0.49633111953735354, + "step": 6000 + }, + { + "epoch": 0.17195918835263097, + "eval_bfov_iou": 0.7886807541246348, + "eval_bfov_iou@0.1": 0.972, + "eval_bfov_iou@0.25": 0.972, + "eval_bfov_iou@0.5": 0.964, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5428571428571428, + "eval_exact_match": 0.383, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 436.5654, + "eval_samples_per_second": 4.581, + "eval_steps_per_second": 0.144, + "eval_task_acc_absolute_direction_mc": 0.804, + "eval_task_acc_camera_rotation_transform_mc": 0.316, + "eval_task_acc_object_conditioned_reorientation_mc": 0.428, + "eval_task_acc_observer_distance_choice": 0.576, + "eval_task_acc_relative_3d_position_mc": 0.532, + "eval_task_acc_relative_direction_mc": 0.52, + "eval_task_acc_seam_continuity_mc": 0.624, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.972, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.972, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.964, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7886807541246348, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 6000 + }, + { + "epoch": 0.17210248767625816, + "grad_norm": 13.28649882982901, + "learning_rate": 9.479988648346242e-07, + "loss": 0.48440990447998045, + "step": 6005 + }, + { + "epoch": 0.17224578699988535, + "grad_norm": 15.699658890833696, + "learning_rate": 9.478957695107849e-07, + "loss": 0.453226375579834, + "step": 6010 + }, + { + "epoch": 0.17238908632351255, + "grad_norm": 36.69164726610978, + "learning_rate": 9.477925777090837e-07, + "loss": 0.48549551963806153, + "step": 6015 + }, + { + "epoch": 0.17253238564713974, + "grad_norm": 30.23864141888512, + "learning_rate": 9.476892894517486e-07, + "loss": 0.47911977767944336, + "step": 6020 + }, + { + "epoch": 0.17267568497076694, + "grad_norm": 17.328657639550798, + "learning_rate": 9.475859047610278e-07, + "loss": 0.47513713836669924, + "step": 6025 + }, + { + "epoch": 0.17281898429439413, + "grad_norm": 44.03242729668975, + "learning_rate": 9.474824236591909e-07, + "loss": 0.5065144538879395, + "step": 6030 + }, + { + "epoch": 0.17296228361802132, + "grad_norm": 46.915800008935015, + "learning_rate": 9.473788461685281e-07, + "loss": 0.4802976608276367, + "step": 6035 + }, + { + "epoch": 0.17310558294164852, + "grad_norm": 11.758954947248682, + "learning_rate": 9.472751723113499e-07, + "loss": 0.4926571846008301, + "step": 6040 + }, + { + "epoch": 0.1732488822652757, + "grad_norm": 17.493925903255754, + "learning_rate": 9.471714021099881e-07, + "loss": 0.4460099220275879, + "step": 6045 + }, + { + "epoch": 0.1733921815889029, + "grad_norm": 33.08841038093934, + "learning_rate": 9.47067535586795e-07, + "loss": 0.5203557968139648, + "step": 6050 + }, + { + "epoch": 0.1735354809125301, + "grad_norm": 36.806470850304706, + "learning_rate": 9.469635727641439e-07, + "loss": 0.48954429626464846, + "step": 6055 + }, + { + "epoch": 0.1736787802361573, + "grad_norm": 22.505183564102115, + "learning_rate": 9.468595136644283e-07, + "loss": 0.4992457389831543, + "step": 6060 + }, + { + "epoch": 0.1738220795597845, + "grad_norm": 16.2503496559608, + "learning_rate": 9.467553583100629e-07, + "loss": 0.5003866672515869, + "step": 6065 + }, + { + "epoch": 0.17396537888341168, + "grad_norm": 15.22972735021795, + "learning_rate": 9.466511067234834e-07, + "loss": 0.5002088069915771, + "step": 6070 + }, + { + "epoch": 0.17410867820703887, + "grad_norm": 13.62213057569805, + "learning_rate": 9.465467589271454e-07, + "loss": 0.469821834564209, + "step": 6075 + }, + { + "epoch": 0.17425197753066607, + "grad_norm": 14.861456340392579, + "learning_rate": 9.464423149435258e-07, + "loss": 0.48299350738525393, + "step": 6080 + }, + { + "epoch": 0.17439527685429324, + "grad_norm": 43.30818328745372, + "learning_rate": 9.463377747951221e-07, + "loss": 0.45112247467041017, + "step": 6085 + }, + { + "epoch": 0.17453857617792043, + "grad_norm": 16.566582445664658, + "learning_rate": 9.462331385044527e-07, + "loss": 0.4682373046875, + "step": 6090 + }, + { + "epoch": 0.17468187550154762, + "grad_norm": 53.08630550124552, + "learning_rate": 9.461284060940561e-07, + "loss": 0.5087890625, + "step": 6095 + }, + { + "epoch": 0.17482517482517482, + "grad_norm": 28.517179397359573, + "learning_rate": 9.460235775864922e-07, + "loss": 0.5002116680145263, + "step": 6100 + }, + { + "epoch": 0.174968474148802, + "grad_norm": 20.494346355257846, + "learning_rate": 9.459186530043414e-07, + "loss": 0.4991103172302246, + "step": 6105 + }, + { + "epoch": 0.1751117734724292, + "grad_norm": 13.180078166684103, + "learning_rate": 9.458136323702047e-07, + "loss": 0.45263004302978516, + "step": 6110 + }, + { + "epoch": 0.1752550727960564, + "grad_norm": 34.69072330908693, + "learning_rate": 9.457085157067034e-07, + "loss": 0.5021364212036132, + "step": 6115 + }, + { + "epoch": 0.1753983721196836, + "grad_norm": 41.84693821616109, + "learning_rate": 9.456033030364803e-07, + "loss": 0.5023571014404297, + "step": 6120 + }, + { + "epoch": 0.1755416714433108, + "grad_norm": 33.988484653778585, + "learning_rate": 9.454979943821985e-07, + "loss": 0.4995841979980469, + "step": 6125 + }, + { + "epoch": 0.17568497076693798, + "grad_norm": 24.779944087582006, + "learning_rate": 9.453925897665416e-07, + "loss": 0.5045446395874024, + "step": 6130 + }, + { + "epoch": 0.17582827009056518, + "grad_norm": 15.193114829620038, + "learning_rate": 9.452870892122139e-07, + "loss": 0.46706762313842776, + "step": 6135 + }, + { + "epoch": 0.17597156941419237, + "grad_norm": 35.674636541899034, + "learning_rate": 9.451814927419407e-07, + "loss": 0.48236522674560545, + "step": 6140 + }, + { + "epoch": 0.17611486873781956, + "grad_norm": 21.324745294330487, + "learning_rate": 9.450758003784676e-07, + "loss": 0.46052942276000974, + "step": 6145 + }, + { + "epoch": 0.17625816806144676, + "grad_norm": 162.50393232738836, + "learning_rate": 9.449700121445612e-07, + "loss": 0.5027780532836914, + "step": 6150 + }, + { + "epoch": 0.17640146738507395, + "grad_norm": 19.001788017172426, + "learning_rate": 9.448641280630083e-07, + "loss": 0.4871206283569336, + "step": 6155 + }, + { + "epoch": 0.17654476670870115, + "grad_norm": 34.82690811955992, + "learning_rate": 9.447581481566167e-07, + "loss": 0.48973236083984373, + "step": 6160 + }, + { + "epoch": 0.17668806603232834, + "grad_norm": 12.303981675363168, + "learning_rate": 9.446520724482146e-07, + "loss": 0.4958535671234131, + "step": 6165 + }, + { + "epoch": 0.17683136535595553, + "grad_norm": 18.29079134095771, + "learning_rate": 9.445459009606514e-07, + "loss": 0.45303921699523925, + "step": 6170 + }, + { + "epoch": 0.1769746646795827, + "grad_norm": 15.798320126499373, + "learning_rate": 9.444396337167961e-07, + "loss": 0.4698214054107666, + "step": 6175 + }, + { + "epoch": 0.1771179640032099, + "grad_norm": 16.75481171107999, + "learning_rate": 9.443332707395393e-07, + "loss": 0.5307960510253906, + "step": 6180 + }, + { + "epoch": 0.1772612633268371, + "grad_norm": 39.85813855785097, + "learning_rate": 9.442268120517919e-07, + "loss": 0.4767946720123291, + "step": 6185 + }, + { + "epoch": 0.17740456265046428, + "grad_norm": 15.573708718392837, + "learning_rate": 9.441202576764852e-07, + "loss": 0.5374834060668945, + "step": 6190 + }, + { + "epoch": 0.17754786197409148, + "grad_norm": 12.191868622294713, + "learning_rate": 9.440136076365712e-07, + "loss": 0.499098539352417, + "step": 6195 + }, + { + "epoch": 0.17769116129771867, + "grad_norm": 29.5301139864622, + "learning_rate": 9.439068619550229e-07, + "loss": 0.47642946243286133, + "step": 6200 + }, + { + "epoch": 0.17783446062134586, + "grad_norm": 16.060477436833025, + "learning_rate": 9.438000206548334e-07, + "loss": 0.5156562805175782, + "step": 6205 + }, + { + "epoch": 0.17797775994497306, + "grad_norm": 14.216962374274436, + "learning_rate": 9.436930837590163e-07, + "loss": 0.47380523681640624, + "step": 6210 + }, + { + "epoch": 0.17812105926860025, + "grad_norm": 16.077837236392618, + "learning_rate": 9.435860512906066e-07, + "loss": 0.4922111988067627, + "step": 6215 + }, + { + "epoch": 0.17826435859222745, + "grad_norm": 13.90826055639149, + "learning_rate": 9.43478923272659e-07, + "loss": 0.49267578125, + "step": 6220 + }, + { + "epoch": 0.17840765791585464, + "grad_norm": 23.047030762831827, + "learning_rate": 9.433716997282493e-07, + "loss": 0.4795839309692383, + "step": 6225 + }, + { + "epoch": 0.17855095723948183, + "grad_norm": 21.74562921097944, + "learning_rate": 9.432643806804737e-07, + "loss": 0.50759916305542, + "step": 6230 + }, + { + "epoch": 0.17869425656310903, + "grad_norm": 13.967881672540251, + "learning_rate": 9.431569661524489e-07, + "loss": 0.46470394134521487, + "step": 6235 + }, + { + "epoch": 0.17883755588673622, + "grad_norm": 13.913467551820755, + "learning_rate": 9.430494561673124e-07, + "loss": 0.47162799835205077, + "step": 6240 + }, + { + "epoch": 0.17898085521036342, + "grad_norm": 15.862245443051068, + "learning_rate": 9.429418507482219e-07, + "loss": 0.5059327125549317, + "step": 6245 + }, + { + "epoch": 0.1791241545339906, + "grad_norm": 15.299191884728724, + "learning_rate": 9.428341499183561e-07, + "loss": 0.49409828186035154, + "step": 6250 + }, + { + "epoch": 0.1792674538576178, + "grad_norm": 15.380544489143828, + "learning_rate": 9.427263537009138e-07, + "loss": 0.5082315921783447, + "step": 6255 + }, + { + "epoch": 0.179410753181245, + "grad_norm": 26.40823680246839, + "learning_rate": 9.426184621191149e-07, + "loss": 0.4538698196411133, + "step": 6260 + }, + { + "epoch": 0.17955405250487216, + "grad_norm": 23.030881501523716, + "learning_rate": 9.425104751961992e-07, + "loss": 0.48288640975952146, + "step": 6265 + }, + { + "epoch": 0.17969735182849936, + "grad_norm": 19.109841559065995, + "learning_rate": 9.424023929554274e-07, + "loss": 0.5139583110809326, + "step": 6270 + }, + { + "epoch": 0.17984065115212655, + "grad_norm": 16.20476554730261, + "learning_rate": 9.42294215420081e-07, + "loss": 0.4764394283294678, + "step": 6275 + }, + { + "epoch": 0.17998395047575375, + "grad_norm": 12.393699017789533, + "learning_rate": 9.421859426134612e-07, + "loss": 0.49099931716918943, + "step": 6280 + }, + { + "epoch": 0.18012724979938094, + "grad_norm": 15.48658877888011, + "learning_rate": 9.420775745588906e-07, + "loss": 0.4753702640533447, + "step": 6285 + }, + { + "epoch": 0.18027054912300813, + "grad_norm": 19.082058402436076, + "learning_rate": 9.419691112797119e-07, + "loss": 0.49472932815551757, + "step": 6290 + }, + { + "epoch": 0.18041384844663533, + "grad_norm": 39.590223517615016, + "learning_rate": 9.418605527992882e-07, + "loss": 0.4945657730102539, + "step": 6295 + }, + { + "epoch": 0.18055714777026252, + "grad_norm": 19.026948491614064, + "learning_rate": 9.417518991410034e-07, + "loss": 0.5134127616882325, + "step": 6300 + }, + { + "epoch": 0.18055714777026252, + "eval_bfov_iou": 0.7939495340237869, + "eval_bfov_iou@0.1": 0.968, + "eval_bfov_iou@0.25": 0.968, + "eval_bfov_iou@0.5": 0.96, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.56, + "eval_exact_match": 0.4005, + "eval_invalid_choice_rate": 0.0005714285714285715, + "eval_runtime": 434.0469, + "eval_samples_per_second": 4.608, + "eval_steps_per_second": 0.145, + "eval_task_acc_absolute_direction_mc": 0.836, + "eval_task_acc_camera_rotation_transform_mc": 0.356, + "eval_task_acc_object_conditioned_reorientation_mc": 0.44, + "eval_task_acc_observer_distance_choice": 0.592, + "eval_task_acc_relative_3d_position_mc": 0.544, + "eval_task_acc_relative_direction_mc": 0.484, + "eval_task_acc_seam_continuity_mc": 0.668, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.968, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.968, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.96, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7939495340237869, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 6300 + }, + { + "epoch": 0.18070044709388972, + "grad_norm": 16.05469313380269, + "learning_rate": 9.416431503282618e-07, + "loss": 0.4571788787841797, + "step": 6305 + }, + { + "epoch": 0.1808437464175169, + "grad_norm": 21.994968464445943, + "learning_rate": 9.415343063844881e-07, + "loss": 0.4860698223114014, + "step": 6310 + }, + { + "epoch": 0.1809870457411441, + "grad_norm": 23.892142919664643, + "learning_rate": 9.414253673331275e-07, + "loss": 0.5197165966033935, + "step": 6315 + }, + { + "epoch": 0.1811303450647713, + "grad_norm": 19.2452433187016, + "learning_rate": 9.413163331976458e-07, + "loss": 0.5070697784423828, + "step": 6320 + }, + { + "epoch": 0.1812736443883985, + "grad_norm": 16.22088289361427, + "learning_rate": 9.412072040015293e-07, + "loss": 0.4667868137359619, + "step": 6325 + }, + { + "epoch": 0.18141694371202569, + "grad_norm": 14.135771631727573, + "learning_rate": 9.410979797682846e-07, + "loss": 0.4634263038635254, + "step": 6330 + }, + { + "epoch": 0.18156024303565288, + "grad_norm": 25.331564687541306, + "learning_rate": 9.409886605214388e-07, + "loss": 0.48778457641601564, + "step": 6335 + }, + { + "epoch": 0.18170354235928007, + "grad_norm": 21.44219753078609, + "learning_rate": 9.408792462845396e-07, + "loss": 0.4784407138824463, + "step": 6340 + }, + { + "epoch": 0.18184684168290727, + "grad_norm": 14.882744168888511, + "learning_rate": 9.407697370811554e-07, + "loss": 0.48533058166503906, + "step": 6345 + }, + { + "epoch": 0.18199014100653446, + "grad_norm": 14.761073596198312, + "learning_rate": 9.406601329348742e-07, + "loss": 0.4552142143249512, + "step": 6350 + }, + { + "epoch": 0.18213344033016163, + "grad_norm": 21.278814111865874, + "learning_rate": 9.405504338693054e-07, + "loss": 0.5118876457214355, + "step": 6355 + }, + { + "epoch": 0.18227673965378882, + "grad_norm": 23.281077865072163, + "learning_rate": 9.404406399080785e-07, + "loss": 0.515137767791748, + "step": 6360 + }, + { + "epoch": 0.18242003897741602, + "grad_norm": 39.75112302574037, + "learning_rate": 9.403307510748431e-07, + "loss": 0.4607226371765137, + "step": 6365 + }, + { + "epoch": 0.1825633383010432, + "grad_norm": 20.216935218033072, + "learning_rate": 9.402207673932696e-07, + "loss": 0.49642367362976075, + "step": 6370 + }, + { + "epoch": 0.1827066376246704, + "grad_norm": 12.229624579062826, + "learning_rate": 9.401106888870489e-07, + "loss": 0.4402345657348633, + "step": 6375 + }, + { + "epoch": 0.1828499369482976, + "grad_norm": 14.615942157676082, + "learning_rate": 9.400005155798921e-07, + "loss": 0.48252573013305666, + "step": 6380 + }, + { + "epoch": 0.1829932362719248, + "grad_norm": 21.154735746160558, + "learning_rate": 9.398902474955308e-07, + "loss": 0.4343718528747559, + "step": 6385 + }, + { + "epoch": 0.18313653559555199, + "grad_norm": 17.644861468565082, + "learning_rate": 9.397798846577169e-07, + "loss": 0.44979658126831057, + "step": 6390 + }, + { + "epoch": 0.18327983491917918, + "grad_norm": 17.913537982512135, + "learning_rate": 9.396694270902232e-07, + "loss": 0.45394139289855956, + "step": 6395 + }, + { + "epoch": 0.18342313424280637, + "grad_norm": 51.430783017321545, + "learning_rate": 9.395588748168421e-07, + "loss": 0.47285938262939453, + "step": 6400 + }, + { + "epoch": 0.18356643356643357, + "grad_norm": 20.047926338989484, + "learning_rate": 9.394482278613871e-07, + "loss": 0.43009281158447266, + "step": 6405 + }, + { + "epoch": 0.18370973289006076, + "grad_norm": 39.821957879803776, + "learning_rate": 9.393374862476918e-07, + "loss": 0.4625079154968262, + "step": 6410 + }, + { + "epoch": 0.18385303221368796, + "grad_norm": 13.368498868497344, + "learning_rate": 9.392266499996102e-07, + "loss": 0.47198801040649413, + "step": 6415 + }, + { + "epoch": 0.18399633153731515, + "grad_norm": 19.712617019702098, + "learning_rate": 9.391157191410166e-07, + "loss": 0.5201051712036133, + "step": 6420 + }, + { + "epoch": 0.18413963086094234, + "grad_norm": 18.900372480978213, + "learning_rate": 9.390046936958058e-07, + "loss": 0.46840634346008303, + "step": 6425 + }, + { + "epoch": 0.18428293018456954, + "grad_norm": 20.292308700994912, + "learning_rate": 9.388935736878931e-07, + "loss": 0.49005465507507323, + "step": 6430 + }, + { + "epoch": 0.18442622950819673, + "grad_norm": 23.254172901078782, + "learning_rate": 9.38782359141214e-07, + "loss": 0.4665557861328125, + "step": 6435 + }, + { + "epoch": 0.18456952883182393, + "grad_norm": 25.99440394248272, + "learning_rate": 9.386710500797244e-07, + "loss": 0.504226541519165, + "step": 6440 + }, + { + "epoch": 0.18471282815545112, + "grad_norm": 14.873801531124357, + "learning_rate": 9.385596465274002e-07, + "loss": 0.494111156463623, + "step": 6445 + }, + { + "epoch": 0.18485612747907829, + "grad_norm": 15.309668660849931, + "learning_rate": 9.384481485082385e-07, + "loss": 0.4625535011291504, + "step": 6450 + }, + { + "epoch": 0.18499942680270548, + "grad_norm": 38.360877944980096, + "learning_rate": 9.38336556046256e-07, + "loss": 0.5041403770446777, + "step": 6455 + }, + { + "epoch": 0.18514272612633267, + "grad_norm": 18.545096730604982, + "learning_rate": 9.382248691654899e-07, + "loss": 0.48190784454345703, + "step": 6460 + }, + { + "epoch": 0.18528602544995987, + "grad_norm": 18.494271443177436, + "learning_rate": 9.381130878899982e-07, + "loss": 0.500686502456665, + "step": 6465 + }, + { + "epoch": 0.18542932477358706, + "grad_norm": 16.29200194692619, + "learning_rate": 9.380012122438586e-07, + "loss": 0.4828601360321045, + "step": 6470 + }, + { + "epoch": 0.18557262409721426, + "grad_norm": 20.280732173741548, + "learning_rate": 9.378892422511692e-07, + "loss": 0.49010868072509767, + "step": 6475 + }, + { + "epoch": 0.18571592342084145, + "grad_norm": 21.74639849653996, + "learning_rate": 9.37777177936049e-07, + "loss": 0.48613510131835935, + "step": 6480 + }, + { + "epoch": 0.18585922274446864, + "grad_norm": 46.05926432910671, + "learning_rate": 9.376650193226366e-07, + "loss": 0.4927687168121338, + "step": 6485 + }, + { + "epoch": 0.18600252206809584, + "grad_norm": 13.87633433523228, + "learning_rate": 9.375527664350915e-07, + "loss": 0.4628766536712646, + "step": 6490 + }, + { + "epoch": 0.18614582139172303, + "grad_norm": 187.33816125232835, + "learning_rate": 9.374404192975932e-07, + "loss": 0.4586909294128418, + "step": 6495 + }, + { + "epoch": 0.18628912071535023, + "grad_norm": 19.258917925971737, + "learning_rate": 9.373279779343415e-07, + "loss": 0.4702129364013672, + "step": 6500 + }, + { + "epoch": 0.18643242003897742, + "grad_norm": 15.626761480786763, + "learning_rate": 9.372154423695567e-07, + "loss": 0.44924297332763674, + "step": 6505 + }, + { + "epoch": 0.18657571936260461, + "grad_norm": 36.46145004405913, + "learning_rate": 9.371028126274789e-07, + "loss": 0.47975893020629884, + "step": 6510 + }, + { + "epoch": 0.1867190186862318, + "grad_norm": 19.063082114106155, + "learning_rate": 9.36990088732369e-07, + "loss": 0.4550337791442871, + "step": 6515 + }, + { + "epoch": 0.186862318009859, + "grad_norm": 70.90891512935599, + "learning_rate": 9.368772707085081e-07, + "loss": 0.5374044895172119, + "step": 6520 + }, + { + "epoch": 0.1870056173334862, + "grad_norm": 31.272122850256682, + "learning_rate": 9.367643585801974e-07, + "loss": 0.45905280113220215, + "step": 6525 + }, + { + "epoch": 0.1871489166571134, + "grad_norm": 40.543189687891086, + "learning_rate": 9.366513523717585e-07, + "loss": 0.4796499252319336, + "step": 6530 + }, + { + "epoch": 0.18729221598074058, + "grad_norm": 14.849073840530394, + "learning_rate": 9.365382521075332e-07, + "loss": 0.49996190071105956, + "step": 6535 + }, + { + "epoch": 0.18743551530436775, + "grad_norm": 21.595822856254824, + "learning_rate": 9.364250578118835e-07, + "loss": 0.5250453472137451, + "step": 6540 + }, + { + "epoch": 0.18757881462799494, + "grad_norm": 16.338651397390777, + "learning_rate": 9.363117695091919e-07, + "loss": 0.5139907836914063, + "step": 6545 + }, + { + "epoch": 0.18772211395162214, + "grad_norm": 19.507197335769774, + "learning_rate": 9.361983872238608e-07, + "loss": 0.4689436912536621, + "step": 6550 + }, + { + "epoch": 0.18786541327524933, + "grad_norm": 26.68957445954551, + "learning_rate": 9.360849109803131e-07, + "loss": 0.5132273674011231, + "step": 6555 + }, + { + "epoch": 0.18800871259887653, + "grad_norm": 14.277448361225062, + "learning_rate": 9.359713408029919e-07, + "loss": 0.4621703624725342, + "step": 6560 + }, + { + "epoch": 0.18815201192250372, + "grad_norm": 17.693685363485496, + "learning_rate": 9.358576767163605e-07, + "loss": 0.5024651050567627, + "step": 6565 + }, + { + "epoch": 0.18829531124613091, + "grad_norm": 41.247528626123575, + "learning_rate": 9.357439187449023e-07, + "loss": 0.49294471740722656, + "step": 6570 + }, + { + "epoch": 0.1884386105697581, + "grad_norm": 31.787740286903823, + "learning_rate": 9.356300669131213e-07, + "loss": 0.4799976348876953, + "step": 6575 + }, + { + "epoch": 0.1885819098933853, + "grad_norm": 15.291514799128311, + "learning_rate": 9.355161212455411e-07, + "loss": 0.48970232009887693, + "step": 6580 + }, + { + "epoch": 0.1887252092170125, + "grad_norm": 17.219161759526077, + "learning_rate": 9.354020817667063e-07, + "loss": 0.48347983360290525, + "step": 6585 + }, + { + "epoch": 0.1888685085406397, + "grad_norm": 15.938731307048997, + "learning_rate": 9.352879485011811e-07, + "loss": 0.46706314086914064, + "step": 6590 + }, + { + "epoch": 0.18901180786426688, + "grad_norm": 20.942589419371796, + "learning_rate": 9.3517372147355e-07, + "loss": 0.45478038787841796, + "step": 6595 + }, + { + "epoch": 0.18915510718789408, + "grad_norm": 24.435934108611328, + "learning_rate": 9.350594007084179e-07, + "loss": 0.469144868850708, + "step": 6600 + }, + { + "epoch": 0.18915510718789408, + "eval_bfov_iou": 0.7624980891910027, + "eval_bfov_iou@0.1": 0.916, + "eval_bfov_iou@0.25": 0.904, + "eval_bfov_iou@0.5": 0.888, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5348571428571428, + "eval_exact_match": 0.3715, + "eval_invalid_choice_rate": 0.001142857142857143, + "eval_runtime": 480.2553, + "eval_samples_per_second": 4.164, + "eval_steps_per_second": 0.131, + "eval_task_acc_absolute_direction_mc": 0.844, + "eval_task_acc_camera_rotation_transform_mc": 0.3, + "eval_task_acc_object_conditioned_reorientation_mc": 0.364, + "eval_task_acc_observer_distance_choice": 0.608, + "eval_task_acc_relative_3d_position_mc": 0.504, + "eval_task_acc_relative_direction_mc": 0.456, + "eval_task_acc_seam_continuity_mc": 0.668, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.916, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.904, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.888, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7624980891910027, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 6600 + }, + { + "epoch": 0.18929840651152127, + "grad_norm": 19.51723859513208, + "learning_rate": 9.349449862304095e-07, + "loss": 0.48018369674682615, + "step": 6605 + }, + { + "epoch": 0.18944170583514847, + "grad_norm": 33.79864576175251, + "learning_rate": 9.348304780641705e-07, + "loss": 0.45242938995361326, + "step": 6610 + }, + { + "epoch": 0.18958500515877566, + "grad_norm": 28.065121846860173, + "learning_rate": 9.347158762343657e-07, + "loss": 0.47193269729614257, + "step": 6615 + }, + { + "epoch": 0.18972830448240285, + "grad_norm": 28.41040961153534, + "learning_rate": 9.34601180765681e-07, + "loss": 0.47458362579345703, + "step": 6620 + }, + { + "epoch": 0.18987160380603005, + "grad_norm": 20.80519019168964, + "learning_rate": 9.344863916828218e-07, + "loss": 0.4692636013031006, + "step": 6625 + }, + { + "epoch": 0.19001490312965721, + "grad_norm": 12.833395744395867, + "learning_rate": 9.343715090105142e-07, + "loss": 0.4746562480926514, + "step": 6630 + }, + { + "epoch": 0.1901582024532844, + "grad_norm": 39.64022547916049, + "learning_rate": 9.342565327735041e-07, + "loss": 0.46120462417602537, + "step": 6635 + }, + { + "epoch": 0.1903015017769116, + "grad_norm": 28.056761946925167, + "learning_rate": 9.341414629965578e-07, + "loss": 0.5181025981903076, + "step": 6640 + }, + { + "epoch": 0.1904448011005388, + "grad_norm": 49.649709299141975, + "learning_rate": 9.340262997044615e-07, + "loss": 0.4850555419921875, + "step": 6645 + }, + { + "epoch": 0.190588100424166, + "grad_norm": 43.30142076894396, + "learning_rate": 9.339110429220214e-07, + "loss": 0.47371797561645507, + "step": 6650 + }, + { + "epoch": 0.19073139974779318, + "grad_norm": 14.13060201775622, + "learning_rate": 9.337956926740645e-07, + "loss": 0.4729037284851074, + "step": 6655 + }, + { + "epoch": 0.19087469907142038, + "grad_norm": 20.2513471216658, + "learning_rate": 9.336802489854374e-07, + "loss": 0.48876585960388186, + "step": 6660 + }, + { + "epoch": 0.19101799839504757, + "grad_norm": 17.519608655419226, + "learning_rate": 9.33564711881007e-07, + "loss": 0.44473724365234374, + "step": 6665 + }, + { + "epoch": 0.19116129771867477, + "grad_norm": 11.799737442150594, + "learning_rate": 9.334490813856601e-07, + "loss": 0.4948561668395996, + "step": 6670 + }, + { + "epoch": 0.19130459704230196, + "grad_norm": 22.240665271281156, + "learning_rate": 9.333333575243039e-07, + "loss": 0.48788065910339357, + "step": 6675 + }, + { + "epoch": 0.19144789636592915, + "grad_norm": 15.770933665388416, + "learning_rate": 9.332175403218658e-07, + "loss": 0.5055879592895508, + "step": 6680 + }, + { + "epoch": 0.19159119568955635, + "grad_norm": 15.459627381517798, + "learning_rate": 9.331016298032928e-07, + "loss": 0.4819929122924805, + "step": 6685 + }, + { + "epoch": 0.19173449501318354, + "grad_norm": 13.512798101186855, + "learning_rate": 9.329856259935524e-07, + "loss": 0.44251384735107424, + "step": 6690 + }, + { + "epoch": 0.19187779433681074, + "grad_norm": 17.382739956570834, + "learning_rate": 9.328695289176323e-07, + "loss": 0.49477672576904297, + "step": 6695 + }, + { + "epoch": 0.19202109366043793, + "grad_norm": 14.994800315292835, + "learning_rate": 9.327533386005398e-07, + "loss": 0.46024656295776367, + "step": 6700 + }, + { + "epoch": 0.19216439298406512, + "grad_norm": 22.39796687281439, + "learning_rate": 9.326370550673028e-07, + "loss": 0.4945563316345215, + "step": 6705 + }, + { + "epoch": 0.19230769230769232, + "grad_norm": 18.407056105110527, + "learning_rate": 9.32520678342969e-07, + "loss": 0.5268344402313232, + "step": 6710 + }, + { + "epoch": 0.1924509916313195, + "grad_norm": 16.0025503681458, + "learning_rate": 9.324042084526063e-07, + "loss": 0.4581875801086426, + "step": 6715 + }, + { + "epoch": 0.1925942909549467, + "grad_norm": 26.419485702690196, + "learning_rate": 9.322876454213027e-07, + "loss": 0.45262556076049804, + "step": 6720 + }, + { + "epoch": 0.19273759027857387, + "grad_norm": 93.48424024031951, + "learning_rate": 9.321709892741657e-07, + "loss": 0.47497334480285647, + "step": 6725 + }, + { + "epoch": 0.19288088960220107, + "grad_norm": 24.17040490190291, + "learning_rate": 9.320542400363238e-07, + "loss": 0.49657535552978516, + "step": 6730 + }, + { + "epoch": 0.19302418892582826, + "grad_norm": 23.702925863593745, + "learning_rate": 9.319373977329247e-07, + "loss": 0.49040675163269043, + "step": 6735 + }, + { + "epoch": 0.19316748824945545, + "grad_norm": 23.77620749942974, + "learning_rate": 9.31820462389137e-07, + "loss": 0.48569841384887696, + "step": 6740 + }, + { + "epoch": 0.19331078757308265, + "grad_norm": 12.846845095143166, + "learning_rate": 9.317034340301486e-07, + "loss": 0.4567368507385254, + "step": 6745 + }, + { + "epoch": 0.19345408689670984, + "grad_norm": 30.04200499860457, + "learning_rate": 9.315863126811676e-07, + "loss": 0.48204989433288575, + "step": 6750 + }, + { + "epoch": 0.19359738622033704, + "grad_norm": 16.907069449500728, + "learning_rate": 9.314690983674223e-07, + "loss": 0.4964712619781494, + "step": 6755 + }, + { + "epoch": 0.19374068554396423, + "grad_norm": 14.241008210009353, + "learning_rate": 9.31351791114161e-07, + "loss": 0.4791990280151367, + "step": 6760 + }, + { + "epoch": 0.19388398486759142, + "grad_norm": 10.93381752842939, + "learning_rate": 9.312343909466519e-07, + "loss": 0.48095178604125977, + "step": 6765 + }, + { + "epoch": 0.19402728419121862, + "grad_norm": 17.21697944762068, + "learning_rate": 9.311168978901833e-07, + "loss": 0.4920661926269531, + "step": 6770 + }, + { + "epoch": 0.1941705835148458, + "grad_norm": 19.859103745435924, + "learning_rate": 9.309993119700636e-07, + "loss": 0.4848301410675049, + "step": 6775 + }, + { + "epoch": 0.194313882838473, + "grad_norm": 16.682334740683956, + "learning_rate": 9.308816332116212e-07, + "loss": 0.44292416572570803, + "step": 6780 + }, + { + "epoch": 0.1944571821621002, + "grad_norm": 17.89546303711239, + "learning_rate": 9.30763861640204e-07, + "loss": 0.44863133430480956, + "step": 6785 + }, + { + "epoch": 0.1946004814857274, + "grad_norm": 19.279236378498393, + "learning_rate": 9.306459972811807e-07, + "loss": 0.4645540237426758, + "step": 6790 + }, + { + "epoch": 0.1947437808093546, + "grad_norm": 13.193309912282118, + "learning_rate": 9.305280401599394e-07, + "loss": 0.5008809566497803, + "step": 6795 + }, + { + "epoch": 0.19488708013298178, + "grad_norm": 25.397767016477346, + "learning_rate": 9.304099903018882e-07, + "loss": 0.4724996566772461, + "step": 6800 + }, + { + "epoch": 0.19503037945660898, + "grad_norm": 25.564612701267297, + "learning_rate": 9.302918477324555e-07, + "loss": 0.48619718551635743, + "step": 6805 + }, + { + "epoch": 0.19517367878023617, + "grad_norm": 15.582754932535481, + "learning_rate": 9.301736124770896e-07, + "loss": 0.4654958724975586, + "step": 6810 + }, + { + "epoch": 0.19531697810386334, + "grad_norm": 20.24967361176894, + "learning_rate": 9.300552845612584e-07, + "loss": 0.4845306873321533, + "step": 6815 + }, + { + "epoch": 0.19546027742749053, + "grad_norm": 31.97739187461764, + "learning_rate": 9.299368640104504e-07, + "loss": 0.5115826606750489, + "step": 6820 + }, + { + "epoch": 0.19560357675111772, + "grad_norm": 18.935418618939433, + "learning_rate": 9.298183508501734e-07, + "loss": 0.47686614990234377, + "step": 6825 + }, + { + "epoch": 0.19574687607474492, + "grad_norm": 29.642864326683927, + "learning_rate": 9.296997451059553e-07, + "loss": 0.46333770751953124, + "step": 6830 + }, + { + "epoch": 0.1958901753983721, + "grad_norm": 21.94178501972612, + "learning_rate": 9.295810468033445e-07, + "loss": 0.46242580413818357, + "step": 6835 + }, + { + "epoch": 0.1960334747219993, + "grad_norm": 16.4636065953138, + "learning_rate": 9.294622559679086e-07, + "loss": 0.4546372413635254, + "step": 6840 + }, + { + "epoch": 0.1961767740456265, + "grad_norm": 26.31272284948762, + "learning_rate": 9.293433726252355e-07, + "loss": 0.4793985843658447, + "step": 6845 + }, + { + "epoch": 0.1963200733692537, + "grad_norm": 19.87319497954334, + "learning_rate": 9.29224396800933e-07, + "loss": 0.47942066192626953, + "step": 6850 + }, + { + "epoch": 0.1964633726928809, + "grad_norm": 27.235688850951913, + "learning_rate": 9.291053285206288e-07, + "loss": 0.4617649555206299, + "step": 6855 + }, + { + "epoch": 0.19660667201650808, + "grad_norm": 21.5620418953853, + "learning_rate": 9.289861678099704e-07, + "loss": 0.460933780670166, + "step": 6860 + }, + { + "epoch": 0.19674997134013528, + "grad_norm": 10.569210213353857, + "learning_rate": 9.288669146946255e-07, + "loss": 0.514802360534668, + "step": 6865 + }, + { + "epoch": 0.19689327066376247, + "grad_norm": 17.729455525114187, + "learning_rate": 9.287475692002814e-07, + "loss": 0.469026517868042, + "step": 6870 + }, + { + "epoch": 0.19703656998738966, + "grad_norm": 20.695984877820287, + "learning_rate": 9.286281313526454e-07, + "loss": 0.5061417102813721, + "step": 6875 + }, + { + "epoch": 0.19717986931101686, + "grad_norm": 29.39798451579697, + "learning_rate": 9.285086011774447e-07, + "loss": 0.46748967170715333, + "step": 6880 + }, + { + "epoch": 0.19732316863464405, + "grad_norm": 26.131804122637032, + "learning_rate": 9.283889787004264e-07, + "loss": 0.4632465362548828, + "step": 6885 + }, + { + "epoch": 0.19746646795827125, + "grad_norm": 21.83346167102836, + "learning_rate": 9.282692639473576e-07, + "loss": 0.4875138759613037, + "step": 6890 + }, + { + "epoch": 0.19760976728189844, + "grad_norm": 13.96887850382924, + "learning_rate": 9.28149456944025e-07, + "loss": 0.4920689582824707, + "step": 6895 + }, + { + "epoch": 0.19775306660552563, + "grad_norm": 17.22091150568239, + "learning_rate": 9.280295577162354e-07, + "loss": 0.5049356460571289, + "step": 6900 + }, + { + "epoch": 0.19775306660552563, + "eval_bfov_iou": 0.7204054317639339, + "eval_bfov_iou@0.1": 0.88, + "eval_bfov_iou@0.25": 0.856, + "eval_bfov_iou@0.5": 0.836, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5371428571428571, + "eval_exact_match": 0.331, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 524.9069, + "eval_samples_per_second": 3.81, + "eval_steps_per_second": 0.12, + "eval_task_acc_absolute_direction_mc": 0.78, + "eval_task_acc_camera_rotation_transform_mc": 0.404, + "eval_task_acc_object_conditioned_reorientation_mc": 0.46, + "eval_task_acc_observer_distance_choice": 0.564, + "eval_task_acc_relative_3d_position_mc": 0.488, + "eval_task_acc_relative_direction_mc": 0.456, + "eval_task_acc_seam_continuity_mc": 0.608, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.88, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.856, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.836, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7204054317639339, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 6900 + }, + { + "epoch": 0.1978963659291528, + "grad_norm": 14.67121160287558, + "learning_rate": 9.279095662898154e-07, + "loss": 0.46758103370666504, + "step": 6905 + }, + { + "epoch": 0.19803966525278, + "grad_norm": 14.113087474986894, + "learning_rate": 9.277894826906114e-07, + "loss": 0.49723081588745116, + "step": 6910 + }, + { + "epoch": 0.1981829645764072, + "grad_norm": 16.033730202269226, + "learning_rate": 9.276693069444899e-07, + "loss": 0.4709041595458984, + "step": 6915 + }, + { + "epoch": 0.19832626390003438, + "grad_norm": 10.433766994319647, + "learning_rate": 9.275490390773366e-07, + "loss": 0.4469902992248535, + "step": 6920 + }, + { + "epoch": 0.19846956322366158, + "grad_norm": 20.049725385367076, + "learning_rate": 9.274286791150581e-07, + "loss": 0.44884638786315917, + "step": 6925 + }, + { + "epoch": 0.19861286254728877, + "grad_norm": 17.869822066740728, + "learning_rate": 9.273082270835797e-07, + "loss": 0.46349363327026366, + "step": 6930 + }, + { + "epoch": 0.19875616187091596, + "grad_norm": 15.775702771752007, + "learning_rate": 9.271876830088475e-07, + "loss": 0.4928903102874756, + "step": 6935 + }, + { + "epoch": 0.19889946119454316, + "grad_norm": 24.63423810990779, + "learning_rate": 9.270670469168264e-07, + "loss": 0.45942344665527346, + "step": 6940 + }, + { + "epoch": 0.19904276051817035, + "grad_norm": 12.600713859186031, + "learning_rate": 9.269463188335025e-07, + "loss": 0.49271697998046876, + "step": 6945 + }, + { + "epoch": 0.19918605984179755, + "grad_norm": 14.234945371343509, + "learning_rate": 9.268254987848803e-07, + "loss": 0.45543460845947265, + "step": 6950 + }, + { + "epoch": 0.19932935916542474, + "grad_norm": 20.36416766346544, + "learning_rate": 9.267045867969851e-07, + "loss": 0.46217756271362304, + "step": 6955 + }, + { + "epoch": 0.19947265848905193, + "grad_norm": 38.36616809051736, + "learning_rate": 9.265835828958614e-07, + "loss": 0.48034420013427737, + "step": 6960 + }, + { + "epoch": 0.19961595781267913, + "grad_norm": 15.442215271387639, + "learning_rate": 9.264624871075742e-07, + "loss": 0.47099857330322265, + "step": 6965 + }, + { + "epoch": 0.19975925713630632, + "grad_norm": 14.14069111437424, + "learning_rate": 9.26341299458207e-07, + "loss": 0.4713392734527588, + "step": 6970 + }, + { + "epoch": 0.19990255645993352, + "grad_norm": 16.649198146355232, + "learning_rate": 9.262200199738647e-07, + "loss": 0.4459673404693604, + "step": 6975 + }, + { + "epoch": 0.2000458557835607, + "grad_norm": 22.63153306739744, + "learning_rate": 9.260986486806708e-07, + "loss": 0.4837819576263428, + "step": 6980 + }, + { + "epoch": 0.2001891551071879, + "grad_norm": 20.703222341404615, + "learning_rate": 9.259771856047691e-07, + "loss": 0.46646652221679685, + "step": 6985 + }, + { + "epoch": 0.2003324544308151, + "grad_norm": 13.832167458177176, + "learning_rate": 9.258556307723231e-07, + "loss": 0.46560983657836913, + "step": 6990 + }, + { + "epoch": 0.20047575375444227, + "grad_norm": 12.459101709134416, + "learning_rate": 9.257339842095158e-07, + "loss": 0.47913780212402346, + "step": 6995 + }, + { + "epoch": 0.20061905307806946, + "grad_norm": 13.858516177354867, + "learning_rate": 9.256122459425504e-07, + "loss": 0.48336095809936525, + "step": 7000 + }, + { + "epoch": 0.20076235240169665, + "grad_norm": 12.455003160217206, + "learning_rate": 9.254904159976496e-07, + "loss": 0.46511125564575195, + "step": 7005 + }, + { + "epoch": 0.20090565172532385, + "grad_norm": 21.723855584718063, + "learning_rate": 9.253684944010558e-07, + "loss": 0.45644245147705076, + "step": 7010 + }, + { + "epoch": 0.20104895104895104, + "grad_norm": 15.571920828435553, + "learning_rate": 9.252464811790312e-07, + "loss": 0.5030141353607178, + "step": 7015 + }, + { + "epoch": 0.20119225037257824, + "grad_norm": 20.741917478625215, + "learning_rate": 9.251243763578578e-07, + "loss": 0.48930983543395995, + "step": 7020 + }, + { + "epoch": 0.20133554969620543, + "grad_norm": 16.384818466336302, + "learning_rate": 9.250021799638373e-07, + "loss": 0.4708984851837158, + "step": 7025 + }, + { + "epoch": 0.20147884901983262, + "grad_norm": 16.466810518411908, + "learning_rate": 9.24879892023291e-07, + "loss": 0.44086060523986814, + "step": 7030 + }, + { + "epoch": 0.20162214834345982, + "grad_norm": 19.321003935574485, + "learning_rate": 9.247575125625602e-07, + "loss": 0.4619112491607666, + "step": 7035 + }, + { + "epoch": 0.201765447667087, + "grad_norm": 62.76136320740223, + "learning_rate": 9.246350416080055e-07, + "loss": 0.47827925682067873, + "step": 7040 + }, + { + "epoch": 0.2019087469907142, + "grad_norm": 21.684176937429864, + "learning_rate": 9.245124791860078e-07, + "loss": 0.4884834289550781, + "step": 7045 + }, + { + "epoch": 0.2020520463143414, + "grad_norm": 24.557992392737503, + "learning_rate": 9.243898253229669e-07, + "loss": 0.5161091327667237, + "step": 7050 + }, + { + "epoch": 0.2021953456379686, + "grad_norm": 14.178472550670474, + "learning_rate": 9.242670800453031e-07, + "loss": 0.47828054428100586, + "step": 7055 + }, + { + "epoch": 0.2023386449615958, + "grad_norm": 24.849984798869905, + "learning_rate": 9.24144243379456e-07, + "loss": 0.49983701705932615, + "step": 7060 + }, + { + "epoch": 0.20248194428522298, + "grad_norm": 47.32883766380881, + "learning_rate": 9.240213153518848e-07, + "loss": 0.4588827610015869, + "step": 7065 + }, + { + "epoch": 0.20262524360885018, + "grad_norm": 13.858740318417743, + "learning_rate": 9.238982959890684e-07, + "loss": 0.4677313804626465, + "step": 7070 + }, + { + "epoch": 0.20276854293247737, + "grad_norm": 15.775036666969813, + "learning_rate": 9.237751853175058e-07, + "loss": 0.46004748344421387, + "step": 7075 + }, + { + "epoch": 0.20291184225610456, + "grad_norm": 71.50367673120778, + "learning_rate": 9.23651983363715e-07, + "loss": 0.47492389678955077, + "step": 7080 + }, + { + "epoch": 0.20305514157973176, + "grad_norm": 14.690730538511888, + "learning_rate": 9.235286901542342e-07, + "loss": 0.47253713607788084, + "step": 7085 + }, + { + "epoch": 0.20319844090335892, + "grad_norm": 13.670196583932153, + "learning_rate": 9.234053057156213e-07, + "loss": 0.4774779319763184, + "step": 7090 + }, + { + "epoch": 0.20334174022698612, + "grad_norm": 23.160865896525372, + "learning_rate": 9.232818300744531e-07, + "loss": 0.4868184566497803, + "step": 7095 + }, + { + "epoch": 0.2034850395506133, + "grad_norm": 14.003144061967639, + "learning_rate": 9.231582632573269e-07, + "loss": 0.4731905937194824, + "step": 7100 + }, + { + "epoch": 0.2036283388742405, + "grad_norm": 14.993985185907485, + "learning_rate": 9.230346052908593e-07, + "loss": 0.46527729034423826, + "step": 7105 + }, + { + "epoch": 0.2037716381978677, + "grad_norm": 20.661487249667246, + "learning_rate": 9.229108562016863e-07, + "loss": 0.47611408233642577, + "step": 7110 + }, + { + "epoch": 0.2039149375214949, + "grad_norm": 18.791582976913954, + "learning_rate": 9.227870160164639e-07, + "loss": 0.4634720802307129, + "step": 7115 + }, + { + "epoch": 0.2040582368451221, + "grad_norm": 14.52605323048179, + "learning_rate": 9.226630847618677e-07, + "loss": 0.4711711883544922, + "step": 7120 + }, + { + "epoch": 0.20420153616874928, + "grad_norm": 12.953302663163573, + "learning_rate": 9.225390624645927e-07, + "loss": 0.49842610359191897, + "step": 7125 + }, + { + "epoch": 0.20434483549237648, + "grad_norm": 17.86630995098794, + "learning_rate": 9.224149491513535e-07, + "loss": 0.4992841243743896, + "step": 7130 + }, + { + "epoch": 0.20448813481600367, + "grad_norm": 21.93266247750687, + "learning_rate": 9.222907448488846e-07, + "loss": 0.518975830078125, + "step": 7135 + }, + { + "epoch": 0.20463143413963086, + "grad_norm": 15.402836325802022, + "learning_rate": 9.221664495839398e-07, + "loss": 0.500742769241333, + "step": 7140 + }, + { + "epoch": 0.20477473346325806, + "grad_norm": 37.408033294574565, + "learning_rate": 9.220420633832926e-07, + "loss": 0.4756328582763672, + "step": 7145 + }, + { + "epoch": 0.20491803278688525, + "grad_norm": 30.25903342692644, + "learning_rate": 9.219175862737362e-07, + "loss": 0.48567638397216795, + "step": 7150 + }, + { + "epoch": 0.20506133211051245, + "grad_norm": 17.552441861641046, + "learning_rate": 9.217930182820832e-07, + "loss": 0.44654231071472167, + "step": 7155 + }, + { + "epoch": 0.20520463143413964, + "grad_norm": 31.553960642189466, + "learning_rate": 9.216683594351659e-07, + "loss": 0.4662157535552979, + "step": 7160 + }, + { + "epoch": 0.20534793075776683, + "grad_norm": 15.63188047064376, + "learning_rate": 9.215436097598361e-07, + "loss": 0.4756485939025879, + "step": 7165 + }, + { + "epoch": 0.20549123008139403, + "grad_norm": 16.929439792572158, + "learning_rate": 9.214187692829651e-07, + "loss": 0.46554107666015626, + "step": 7170 + }, + { + "epoch": 0.20563452940502122, + "grad_norm": 22.98713795492635, + "learning_rate": 9.212938380314442e-07, + "loss": 0.4641261100769043, + "step": 7175 + }, + { + "epoch": 0.2057778287286484, + "grad_norm": 17.147388444880455, + "learning_rate": 9.211688160321835e-07, + "loss": 0.42797250747680665, + "step": 7180 + }, + { + "epoch": 0.20592112805227558, + "grad_norm": 13.628980393739026, + "learning_rate": 9.21043703312113e-07, + "loss": 0.49752178192138674, + "step": 7185 + }, + { + "epoch": 0.20606442737590278, + "grad_norm": 16.92274742074844, + "learning_rate": 9.209184998981828e-07, + "loss": 0.49794654846191405, + "step": 7190 + }, + { + "epoch": 0.20620772669952997, + "grad_norm": 26.563244543093337, + "learning_rate": 9.207932058173614e-07, + "loss": 0.4870181083679199, + "step": 7195 + }, + { + "epoch": 0.20635102602315716, + "grad_norm": 30.59228076797566, + "learning_rate": 9.206678210966379e-07, + "loss": 0.46663079261779783, + "step": 7200 + }, + { + "epoch": 0.20635102602315716, + "eval_bfov_iou": 0.7863954890859952, + "eval_bfov_iou@0.1": 0.948, + "eval_bfov_iou@0.25": 0.932, + "eval_bfov_iou@0.5": 0.924, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.5897142857142857, + "eval_exact_match": 0.245, + "eval_invalid_choice_rate": 0.017142857142857144, + "eval_runtime": 1096.6013, + "eval_samples_per_second": 1.824, + "eval_steps_per_second": 0.057, + "eval_task_acc_absolute_direction_mc": 0.808, + "eval_task_acc_camera_rotation_transform_mc": 0.56, + "eval_task_acc_object_conditioned_reorientation_mc": 0.544, + "eval_task_acc_observer_distance_choice": 0.592, + "eval_task_acc_relative_3d_position_mc": 0.484, + "eval_task_acc_relative_direction_mc": 0.5, + "eval_task_acc_seam_continuity_mc": 0.64, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.948, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.932, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.924, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7863954890859952, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 7200 + }, + { + "epoch": 0.20649432534678436, + "grad_norm": 19.81228431279586, + "learning_rate": 9.205423457630204e-07, + "loss": 0.4537327766418457, + "step": 7205 + }, + { + "epoch": 0.20663762467041155, + "grad_norm": 45.752178247248004, + "learning_rate": 9.204167798435365e-07, + "loss": 0.47133455276489256, + "step": 7210 + }, + { + "epoch": 0.20678092399403875, + "grad_norm": 26.296714459436036, + "learning_rate": 9.202911233652334e-07, + "loss": 0.46477227210998534, + "step": 7215 + }, + { + "epoch": 0.20692422331766594, + "grad_norm": 16.500455184637307, + "learning_rate": 9.20165376355178e-07, + "loss": 0.4517394542694092, + "step": 7220 + }, + { + "epoch": 0.20706752264129313, + "grad_norm": 16.37885269867787, + "learning_rate": 9.200395388404563e-07, + "loss": 0.44724388122558595, + "step": 7225 + }, + { + "epoch": 0.20721082196492033, + "grad_norm": 22.00488794246895, + "learning_rate": 9.199136108481741e-07, + "loss": 0.4753090858459473, + "step": 7230 + }, + { + "epoch": 0.20735412128854752, + "grad_norm": 52.14005584451313, + "learning_rate": 9.197875924054565e-07, + "loss": 0.47364349365234376, + "step": 7235 + }, + { + "epoch": 0.20749742061217472, + "grad_norm": 53.85942218353156, + "learning_rate": 9.196614835394485e-07, + "loss": 0.4734331130981445, + "step": 7240 + }, + { + "epoch": 0.2076407199358019, + "grad_norm": 39.91601335896776, + "learning_rate": 9.19535284277314e-07, + "loss": 0.48821229934692384, + "step": 7245 + }, + { + "epoch": 0.2077840192594291, + "grad_norm": 14.200644092833844, + "learning_rate": 9.194089946462366e-07, + "loss": 0.48743181228637694, + "step": 7250 + }, + { + "epoch": 0.2079273185830563, + "grad_norm": 16.6380325761619, + "learning_rate": 9.192826146734196e-07, + "loss": 0.4543587684631348, + "step": 7255 + }, + { + "epoch": 0.2080706179066835, + "grad_norm": 27.24125960690116, + "learning_rate": 9.191561443860853e-07, + "loss": 0.5159170150756835, + "step": 7260 + }, + { + "epoch": 0.20821391723031069, + "grad_norm": 21.727443700429845, + "learning_rate": 9.190295838114761e-07, + "loss": 0.4394519805908203, + "step": 7265 + }, + { + "epoch": 0.20835721655393785, + "grad_norm": 139.0761106974069, + "learning_rate": 9.189029329768531e-07, + "loss": 0.5036822319030761, + "step": 7270 + }, + { + "epoch": 0.20850051587756505, + "grad_norm": 14.808523846137147, + "learning_rate": 9.187761919094973e-07, + "loss": 0.45519561767578126, + "step": 7275 + }, + { + "epoch": 0.20864381520119224, + "grad_norm": 13.963614937606225, + "learning_rate": 9.186493606367092e-07, + "loss": 0.48427581787109375, + "step": 7280 + }, + { + "epoch": 0.20878711452481943, + "grad_norm": 11.266546445987386, + "learning_rate": 9.185224391858082e-07, + "loss": 0.466748046875, + "step": 7285 + }, + { + "epoch": 0.20893041384844663, + "grad_norm": 23.877434241394067, + "learning_rate": 9.183954275841339e-07, + "loss": 0.4813971519470215, + "step": 7290 + }, + { + "epoch": 0.20907371317207382, + "grad_norm": 14.159484714932102, + "learning_rate": 9.182683258590447e-07, + "loss": 0.4867410182952881, + "step": 7295 + }, + { + "epoch": 0.20921701249570102, + "grad_norm": 20.777516458044772, + "learning_rate": 9.181411340379188e-07, + "loss": 0.484747314453125, + "step": 7300 + }, + { + "epoch": 0.2093603118193282, + "grad_norm": 19.80772486953937, + "learning_rate": 9.180138521481535e-07, + "loss": 0.4966930389404297, + "step": 7305 + }, + { + "epoch": 0.2095036111429554, + "grad_norm": 25.3832324254979, + "learning_rate": 9.178864802171655e-07, + "loss": 0.5027919292449952, + "step": 7310 + }, + { + "epoch": 0.2096469104665826, + "grad_norm": 17.0221609922728, + "learning_rate": 9.177590182723913e-07, + "loss": 0.46949195861816406, + "step": 7315 + }, + { + "epoch": 0.2097902097902098, + "grad_norm": 14.374841640207364, + "learning_rate": 9.176314663412863e-07, + "loss": 0.4752321243286133, + "step": 7320 + }, + { + "epoch": 0.20993350911383699, + "grad_norm": 16.27122930426815, + "learning_rate": 9.175038244513258e-07, + "loss": 0.4454025745391846, + "step": 7325 + }, + { + "epoch": 0.21007680843746418, + "grad_norm": 43.26480191852943, + "learning_rate": 9.173760926300038e-07, + "loss": 0.46703543663024905, + "step": 7330 + }, + { + "epoch": 0.21022010776109137, + "grad_norm": 25.789654446841602, + "learning_rate": 9.172482709048343e-07, + "loss": 0.47612571716308594, + "step": 7335 + }, + { + "epoch": 0.21036340708471857, + "grad_norm": 31.331879491325708, + "learning_rate": 9.171203593033503e-07, + "loss": 0.48381433486938474, + "step": 7340 + }, + { + "epoch": 0.21050670640834576, + "grad_norm": 14.766885978758959, + "learning_rate": 9.169923578531045e-07, + "loss": 0.48297948837280275, + "step": 7345 + }, + { + "epoch": 0.21065000573197296, + "grad_norm": 14.663058850560265, + "learning_rate": 9.168642665816684e-07, + "loss": 0.4730534553527832, + "step": 7350 + }, + { + "epoch": 0.21079330505560015, + "grad_norm": 32.93895931636781, + "learning_rate": 9.167360855166333e-07, + "loss": 0.4767171382904053, + "step": 7355 + }, + { + "epoch": 0.21093660437922734, + "grad_norm": 11.88347698949976, + "learning_rate": 9.1660781468561e-07, + "loss": 0.48899450302124026, + "step": 7360 + }, + { + "epoch": 0.2110799037028545, + "grad_norm": 22.01818001643965, + "learning_rate": 9.164794541162279e-07, + "loss": 0.5050251007080078, + "step": 7365 + }, + { + "epoch": 0.2112232030264817, + "grad_norm": 25.878021522292457, + "learning_rate": 9.163510038361364e-07, + "loss": 0.4814760208129883, + "step": 7370 + }, + { + "epoch": 0.2113665023501089, + "grad_norm": 20.796056854709303, + "learning_rate": 9.162224638730041e-07, + "loss": 0.469334077835083, + "step": 7375 + }, + { + "epoch": 0.2115098016737361, + "grad_norm": 53.33956696049317, + "learning_rate": 9.160938342545187e-07, + "loss": 0.46192193031311035, + "step": 7380 + }, + { + "epoch": 0.21165310099736329, + "grad_norm": 12.787500776815138, + "learning_rate": 9.159651150083874e-07, + "loss": 0.474854564666748, + "step": 7385 + }, + { + "epoch": 0.21179640032099048, + "grad_norm": 29.806828778133454, + "learning_rate": 9.158363061623367e-07, + "loss": 0.48052139282226564, + "step": 7390 + }, + { + "epoch": 0.21193969964461767, + "grad_norm": 13.753204100659337, + "learning_rate": 9.15707407744112e-07, + "loss": 0.4627431869506836, + "step": 7395 + }, + { + "epoch": 0.21208299896824487, + "grad_norm": 25.92404471523998, + "learning_rate": 9.155784197814789e-07, + "loss": 0.4490457057952881, + "step": 7400 + }, + { + "epoch": 0.21222629829187206, + "grad_norm": 14.981386306238784, + "learning_rate": 9.154493423022213e-07, + "loss": 0.4712789535522461, + "step": 7405 + }, + { + "epoch": 0.21236959761549926, + "grad_norm": 23.832380576002905, + "learning_rate": 9.153201753341429e-07, + "loss": 0.46287841796875, + "step": 7410 + }, + { + "epoch": 0.21251289693912645, + "grad_norm": 14.086115495931065, + "learning_rate": 9.151909189050667e-07, + "loss": 0.46623954772949217, + "step": 7415 + }, + { + "epoch": 0.21265619626275364, + "grad_norm": 23.67416142892677, + "learning_rate": 9.150615730428349e-07, + "loss": 0.4114354133605957, + "step": 7420 + }, + { + "epoch": 0.21279949558638084, + "grad_norm": 19.413634350760827, + "learning_rate": 9.149321377753086e-07, + "loss": 0.4728558540344238, + "step": 7425 + }, + { + "epoch": 0.21294279491000803, + "grad_norm": 11.567099832520544, + "learning_rate": 9.148026131303688e-07, + "loss": 0.46999101638793944, + "step": 7430 + }, + { + "epoch": 0.21308609423363523, + "grad_norm": 24.162094858256474, + "learning_rate": 9.146729991359152e-07, + "loss": 0.4835094928741455, + "step": 7435 + }, + { + "epoch": 0.21322939355726242, + "grad_norm": 16.269362474977353, + "learning_rate": 9.145432958198674e-07, + "loss": 0.4901141166687012, + "step": 7440 + }, + { + "epoch": 0.21337269288088961, + "grad_norm": 61.9195224994652, + "learning_rate": 9.144135032101632e-07, + "loss": 0.4695981502532959, + "step": 7445 + }, + { + "epoch": 0.2135159922045168, + "grad_norm": 57.26498904012588, + "learning_rate": 9.142836213347607e-07, + "loss": 0.4846305847167969, + "step": 7450 + }, + { + "epoch": 0.21365929152814397, + "grad_norm": 12.702299737341912, + "learning_rate": 9.141536502216365e-07, + "loss": 0.4942293643951416, + "step": 7455 + }, + { + "epoch": 0.21380259085177117, + "grad_norm": 13.108827682881634, + "learning_rate": 9.14023589898787e-07, + "loss": 0.49108448028564455, + "step": 7460 + }, + { + "epoch": 0.21394589017539836, + "grad_norm": 20.386195808282967, + "learning_rate": 9.138934403942273e-07, + "loss": 0.4766553401947021, + "step": 7465 + }, + { + "epoch": 0.21408918949902556, + "grad_norm": 18.61316404404482, + "learning_rate": 9.13763201735992e-07, + "loss": 0.4868764400482178, + "step": 7470 + }, + { + "epoch": 0.21423248882265275, + "grad_norm": 13.792898307488034, + "learning_rate": 9.136328739521348e-07, + "loss": 0.49263248443603513, + "step": 7475 + }, + { + "epoch": 0.21437578814627994, + "grad_norm": 11.387721468397622, + "learning_rate": 9.135024570707286e-07, + "loss": 0.47518043518066405, + "step": 7480 + }, + { + "epoch": 0.21451908746990714, + "grad_norm": 21.52759150722355, + "learning_rate": 9.133719511198656e-07, + "loss": 0.4827613353729248, + "step": 7485 + }, + { + "epoch": 0.21466238679353433, + "grad_norm": 19.980428684792702, + "learning_rate": 9.132413561276571e-07, + "loss": 0.5279246807098389, + "step": 7490 + }, + { + "epoch": 0.21480568611716153, + "grad_norm": 21.490603203822488, + "learning_rate": 9.131106721222335e-07, + "loss": 0.48525333404541016, + "step": 7495 + }, + { + "epoch": 0.21494898544078872, + "grad_norm": 17.591172147320407, + "learning_rate": 9.129798991317445e-07, + "loss": 0.5012947082519531, + "step": 7500 + }, + { + "epoch": 0.21494898544078872, + "eval_bfov_iou": 0.7688340430246426, + "eval_bfov_iou@0.1": 0.948, + "eval_bfov_iou@0.25": 0.936, + "eval_bfov_iou@0.5": 0.932, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.6348571428571429, + "eval_exact_match": 0.2515, + "eval_invalid_choice_rate": 0.008571428571428572, + "eval_runtime": 809.8467, + "eval_samples_per_second": 2.47, + "eval_steps_per_second": 0.078, + "eval_task_acc_absolute_direction_mc": 0.852, + "eval_task_acc_camera_rotation_transform_mc": 0.668, + "eval_task_acc_object_conditioned_reorientation_mc": 0.572, + "eval_task_acc_observer_distance_choice": 0.596, + "eval_task_acc_relative_3d_position_mc": 0.5, + "eval_task_acc_relative_direction_mc": 0.572, + "eval_task_acc_seam_continuity_mc": 0.684, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.948, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.936, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.932, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7688340430246426, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 7500 + }, + { + "epoch": 0.21509228476441591, + "grad_norm": 14.09139525267072, + "learning_rate": 9.128490371843589e-07, + "loss": 0.48622951507568357, + "step": 7505 + }, + { + "epoch": 0.2152355840880431, + "grad_norm": 16.37711038922507, + "learning_rate": 9.127180863082649e-07, + "loss": 0.4790192604064941, + "step": 7510 + }, + { + "epoch": 0.2153788834116703, + "grad_norm": 20.225435433869247, + "learning_rate": 9.125870465316693e-07, + "loss": 0.4657484531402588, + "step": 7515 + }, + { + "epoch": 0.2155221827352975, + "grad_norm": 15.40992924681378, + "learning_rate": 9.124559178827986e-07, + "loss": 0.5151630878448487, + "step": 7520 + }, + { + "epoch": 0.2156654820589247, + "grad_norm": 19.456170933555338, + "learning_rate": 9.123247003898983e-07, + "loss": 0.4617225170135498, + "step": 7525 + }, + { + "epoch": 0.21580878138255188, + "grad_norm": 17.45966465097033, + "learning_rate": 9.121933940812328e-07, + "loss": 0.47251362800598146, + "step": 7530 + }, + { + "epoch": 0.21595208070617908, + "grad_norm": 16.16949054802237, + "learning_rate": 9.12061998985086e-07, + "loss": 0.492618465423584, + "step": 7535 + }, + { + "epoch": 0.21609538002980627, + "grad_norm": 13.424778946872426, + "learning_rate": 9.119305151297605e-07, + "loss": 0.473355770111084, + "step": 7540 + }, + { + "epoch": 0.21623867935343344, + "grad_norm": 23.614741994757328, + "learning_rate": 9.117989425435784e-07, + "loss": 0.5028592109680176, + "step": 7545 + }, + { + "epoch": 0.21638197867706063, + "grad_norm": 29.953064861795994, + "learning_rate": 9.116672812548807e-07, + "loss": 0.4698647975921631, + "step": 7550 + }, + { + "epoch": 0.21652527800068783, + "grad_norm": 17.717378120228016, + "learning_rate": 9.115355312920275e-07, + "loss": 0.4667954921722412, + "step": 7555 + }, + { + "epoch": 0.21666857732431502, + "grad_norm": 14.558690473178427, + "learning_rate": 9.114036926833984e-07, + "loss": 0.5095792770385742, + "step": 7560 + }, + { + "epoch": 0.21681187664794221, + "grad_norm": 45.149677105413424, + "learning_rate": 9.112717654573914e-07, + "loss": 0.47766361236572263, + "step": 7565 + }, + { + "epoch": 0.2169551759715694, + "grad_norm": 12.333357167098358, + "learning_rate": 9.11139749642424e-07, + "loss": 0.44264726638793944, + "step": 7570 + }, + { + "epoch": 0.2170984752951966, + "grad_norm": 19.452479914749635, + "learning_rate": 9.110076452669328e-07, + "loss": 0.49488401412963867, + "step": 7575 + }, + { + "epoch": 0.2172417746188238, + "grad_norm": 14.559161368752566, + "learning_rate": 9.108754523593736e-07, + "loss": 0.48924827575683594, + "step": 7580 + }, + { + "epoch": 0.217385073942451, + "grad_norm": 12.353786260538008, + "learning_rate": 9.107431709482208e-07, + "loss": 0.4434042453765869, + "step": 7585 + }, + { + "epoch": 0.21752837326607818, + "grad_norm": 23.681710522056388, + "learning_rate": 9.106108010619683e-07, + "loss": 0.47377767562866213, + "step": 7590 + }, + { + "epoch": 0.21767167258970538, + "grad_norm": 22.065571902413968, + "learning_rate": 9.104783427291288e-07, + "loss": 0.49634265899658203, + "step": 7595 + }, + { + "epoch": 0.21781497191333257, + "grad_norm": 19.9969835362856, + "learning_rate": 9.103457959782342e-07, + "loss": 0.4513420104980469, + "step": 7600 + }, + { + "epoch": 0.21795827123695977, + "grad_norm": 10.682187134208858, + "learning_rate": 9.102131608378355e-07, + "loss": 0.4597185134887695, + "step": 7605 + }, + { + "epoch": 0.21810157056058696, + "grad_norm": 14.126234728524073, + "learning_rate": 9.100804373365024e-07, + "loss": 0.45395450592041015, + "step": 7610 + }, + { + "epoch": 0.21824486988421415, + "grad_norm": 16.843862394117586, + "learning_rate": 9.099476255028241e-07, + "loss": 0.4749272346496582, + "step": 7615 + }, + { + "epoch": 0.21838816920784135, + "grad_norm": 24.87934934716334, + "learning_rate": 9.098147253654086e-07, + "loss": 0.46436729431152346, + "step": 7620 + }, + { + "epoch": 0.21853146853146854, + "grad_norm": 16.034255643854358, + "learning_rate": 9.096817369528826e-07, + "loss": 0.5037190437316894, + "step": 7625 + }, + { + "epoch": 0.21867476785509574, + "grad_norm": 19.568107423386586, + "learning_rate": 9.095486602938926e-07, + "loss": 0.5293160438537597, + "step": 7630 + }, + { + "epoch": 0.2188180671787229, + "grad_norm": 33.841097222749205, + "learning_rate": 9.094154954171034e-07, + "loss": 0.4540552616119385, + "step": 7635 + }, + { + "epoch": 0.2189613665023501, + "grad_norm": 20.5028558851386, + "learning_rate": 9.09282242351199e-07, + "loss": 0.4801305294036865, + "step": 7640 + }, + { + "epoch": 0.2191046658259773, + "grad_norm": 51.126982655992045, + "learning_rate": 9.091489011248826e-07, + "loss": 0.5087443351745605, + "step": 7645 + }, + { + "epoch": 0.21924796514960448, + "grad_norm": 12.870021835406313, + "learning_rate": 9.090154717668759e-07, + "loss": 0.4624215602874756, + "step": 7650 + }, + { + "epoch": 0.21939126447323168, + "grad_norm": 16.574666432148366, + "learning_rate": 9.088819543059203e-07, + "loss": 0.47555155754089357, + "step": 7655 + }, + { + "epoch": 0.21953456379685887, + "grad_norm": 13.255513047446346, + "learning_rate": 9.087483487707757e-07, + "loss": 0.43019819259643555, + "step": 7660 + }, + { + "epoch": 0.21967786312048607, + "grad_norm": 10.657741090295442, + "learning_rate": 9.086146551902207e-07, + "loss": 0.44695796966552737, + "step": 7665 + }, + { + "epoch": 0.21982116244411326, + "grad_norm": 15.374892654315373, + "learning_rate": 9.084808735930539e-07, + "loss": 0.49388895034790037, + "step": 7670 + }, + { + "epoch": 0.21996446176774045, + "grad_norm": 20.556474615766824, + "learning_rate": 9.083470040080916e-07, + "loss": 0.51600341796875, + "step": 7675 + }, + { + "epoch": 0.22010776109136765, + "grad_norm": 33.72987320168669, + "learning_rate": 9.0821304646417e-07, + "loss": 0.48788156509399416, + "step": 7680 + }, + { + "epoch": 0.22025106041499484, + "grad_norm": 46.64254400351621, + "learning_rate": 9.080790009901437e-07, + "loss": 0.4891310691833496, + "step": 7685 + }, + { + "epoch": 0.22039435973862204, + "grad_norm": 15.36326110699949, + "learning_rate": 9.079448676148865e-07, + "loss": 0.4849270820617676, + "step": 7690 + }, + { + "epoch": 0.22053765906224923, + "grad_norm": 24.555860537997653, + "learning_rate": 9.078106463672909e-07, + "loss": 0.43263258934021, + "step": 7695 + }, + { + "epoch": 0.22068095838587642, + "grad_norm": 19.008369559606667, + "learning_rate": 9.076763372762688e-07, + "loss": 0.45667591094970705, + "step": 7700 + }, + { + "epoch": 0.22082425770950362, + "grad_norm": 26.865827827680757, + "learning_rate": 9.075419403707505e-07, + "loss": 0.45710954666137693, + "step": 7705 + }, + { + "epoch": 0.2209675570331308, + "grad_norm": 28.945710724425386, + "learning_rate": 9.074074556796854e-07, + "loss": 0.4640812873840332, + "step": 7710 + }, + { + "epoch": 0.221110856356758, + "grad_norm": 97.40509956940498, + "learning_rate": 9.07272883232042e-07, + "loss": 0.4634847640991211, + "step": 7715 + }, + { + "epoch": 0.2212541556803852, + "grad_norm": 17.003926613138553, + "learning_rate": 9.071382230568075e-07, + "loss": 0.47771611213684084, + "step": 7720 + }, + { + "epoch": 0.2213974550040124, + "grad_norm": 19.159538609198854, + "learning_rate": 9.070034751829878e-07, + "loss": 0.47121219635009765, + "step": 7725 + }, + { + "epoch": 0.22154075432763956, + "grad_norm": 18.529614401451784, + "learning_rate": 9.068686396396082e-07, + "loss": 0.5034384727478027, + "step": 7730 + }, + { + "epoch": 0.22168405365126675, + "grad_norm": 14.068885700577145, + "learning_rate": 9.067337164557126e-07, + "loss": 0.4271847724914551, + "step": 7735 + }, + { + "epoch": 0.22182735297489395, + "grad_norm": 24.319709309456822, + "learning_rate": 9.065987056603637e-07, + "loss": 0.45923852920532227, + "step": 7740 + }, + { + "epoch": 0.22197065229852114, + "grad_norm": 11.65652627183937, + "learning_rate": 9.064636072826431e-07, + "loss": 0.45700559616088865, + "step": 7745 + }, + { + "epoch": 0.22211395162214834, + "grad_norm": 20.827609949330316, + "learning_rate": 9.063284213516514e-07, + "loss": 0.46802310943603515, + "step": 7750 + }, + { + "epoch": 0.22225725094577553, + "grad_norm": 18.356202961632462, + "learning_rate": 9.06193147896508e-07, + "loss": 0.47342476844787595, + "step": 7755 + }, + { + "epoch": 0.22240055026940272, + "grad_norm": 15.19206674313907, + "learning_rate": 9.060577869463511e-07, + "loss": 0.490079927444458, + "step": 7760 + }, + { + "epoch": 0.22254384959302992, + "grad_norm": 20.77204232596273, + "learning_rate": 9.059223385303378e-07, + "loss": 0.4362484931945801, + "step": 7765 + }, + { + "epoch": 0.2226871489166571, + "grad_norm": 71.27568332370348, + "learning_rate": 9.057868026776441e-07, + "loss": 0.4878055572509766, + "step": 7770 + }, + { + "epoch": 0.2228304482402843, + "grad_norm": 17.217259364184322, + "learning_rate": 9.056511794174647e-07, + "loss": 0.48216638565063474, + "step": 7775 + }, + { + "epoch": 0.2229737475639115, + "grad_norm": 44.59598855128162, + "learning_rate": 9.055154687790132e-07, + "loss": 0.4633878231048584, + "step": 7780 + }, + { + "epoch": 0.2231170468875387, + "grad_norm": 24.723978928016702, + "learning_rate": 9.053796707915219e-07, + "loss": 0.49848089218139646, + "step": 7785 + }, + { + "epoch": 0.2232603462111659, + "grad_norm": 19.073092819115217, + "learning_rate": 9.052437854842421e-07, + "loss": 0.4851548194885254, + "step": 7790 + }, + { + "epoch": 0.22340364553479308, + "grad_norm": 16.523295650425414, + "learning_rate": 9.051078128864439e-07, + "loss": 0.4466727256774902, + "step": 7795 + }, + { + "epoch": 0.22354694485842028, + "grad_norm": 22.363779805198806, + "learning_rate": 9.049717530274162e-07, + "loss": 0.4677853584289551, + "step": 7800 + }, + { + "epoch": 0.22354694485842028, + "eval_bfov_iou": 0.7850526292769187, + "eval_bfov_iou@0.1": 0.968, + "eval_bfov_iou@0.25": 0.96, + "eval_bfov_iou@0.5": 0.952, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.6068571428571429, + "eval_exact_match": 0.2785, + "eval_invalid_choice_rate": 0.0, + "eval_runtime": 631.2393, + "eval_samples_per_second": 3.168, + "eval_steps_per_second": 0.1, + "eval_task_acc_absolute_direction_mc": 0.876, + "eval_task_acc_camera_rotation_transform_mc": 0.584, + "eval_task_acc_object_conditioned_reorientation_mc": 0.504, + "eval_task_acc_observer_distance_choice": 0.576, + "eval_task_acc_relative_3d_position_mc": 0.508, + "eval_task_acc_relative_direction_mc": 0.528, + "eval_task_acc_seam_continuity_mc": 0.672, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.968, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.96, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.952, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7850526292769187, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 7800 + }, + { + "epoch": 0.22369024418204747, + "grad_norm": 18.09622059670904, + "learning_rate": 9.048356059364664e-07, + "loss": 0.49361138343811034, + "step": 7805 + }, + { + "epoch": 0.22383354350567466, + "grad_norm": 21.024202532117737, + "learning_rate": 9.04699371642921e-07, + "loss": 0.5028865814208985, + "step": 7810 + }, + { + "epoch": 0.22397684282930186, + "grad_norm": 22.511302494184584, + "learning_rate": 9.045630501761252e-07, + "loss": 0.4757694244384766, + "step": 7815 + }, + { + "epoch": 0.22412014215292902, + "grad_norm": 20.400748074694977, + "learning_rate": 9.044266415654431e-07, + "loss": 0.45992727279663087, + "step": 7820 + }, + { + "epoch": 0.22426344147655622, + "grad_norm": 27.322855905497345, + "learning_rate": 9.042901458402573e-07, + "loss": 0.48706493377685545, + "step": 7825 + }, + { + "epoch": 0.2244067408001834, + "grad_norm": 12.646892675273781, + "learning_rate": 9.041535630299695e-07, + "loss": 0.43868389129638674, + "step": 7830 + }, + { + "epoch": 0.2245500401238106, + "grad_norm": 14.066305788851444, + "learning_rate": 9.040168931639998e-07, + "loss": 0.44563984870910645, + "step": 7835 + }, + { + "epoch": 0.2246933394474378, + "grad_norm": 24.518569136289518, + "learning_rate": 9.038801362717873e-07, + "loss": 0.4728818893432617, + "step": 7840 + }, + { + "epoch": 0.224836638771065, + "grad_norm": 16.253362861586517, + "learning_rate": 9.037432923827899e-07, + "loss": 0.4454965591430664, + "step": 7845 + }, + { + "epoch": 0.2249799380946922, + "grad_norm": 35.457978357521526, + "learning_rate": 9.036063615264838e-07, + "loss": 0.46613445281982424, + "step": 7850 + }, + { + "epoch": 0.22512323741831938, + "grad_norm": 16.82127347623105, + "learning_rate": 9.034693437323646e-07, + "loss": 0.4794048309326172, + "step": 7855 + }, + { + "epoch": 0.22526653674194658, + "grad_norm": 12.818457944977713, + "learning_rate": 9.033322390299461e-07, + "loss": 0.47777886390686036, + "step": 7860 + }, + { + "epoch": 0.22540983606557377, + "grad_norm": 228.28649591503566, + "learning_rate": 9.031950474487608e-07, + "loss": 0.472057580947876, + "step": 7865 + }, + { + "epoch": 0.22555313538920096, + "grad_norm": 33.42133370417481, + "learning_rate": 9.030577690183605e-07, + "loss": 0.4758355140686035, + "step": 7870 + }, + { + "epoch": 0.22569643471282816, + "grad_norm": 17.14582565104984, + "learning_rate": 9.029204037683151e-07, + "loss": 0.43082609176635744, + "step": 7875 + }, + { + "epoch": 0.22583973403645535, + "grad_norm": 19.395853263128554, + "learning_rate": 9.027829517282133e-07, + "loss": 0.4908616542816162, + "step": 7880 + }, + { + "epoch": 0.22598303336008255, + "grad_norm": 31.923750407010814, + "learning_rate": 9.026454129276628e-07, + "loss": 0.42383298873901365, + "step": 7885 + }, + { + "epoch": 0.22612633268370974, + "grad_norm": 19.176496818675165, + "learning_rate": 9.025077873962899e-07, + "loss": 0.47570023536682127, + "step": 7890 + }, + { + "epoch": 0.22626963200733693, + "grad_norm": 16.94951802670471, + "learning_rate": 9.023700751637393e-07, + "loss": 0.47547216415405275, + "step": 7895 + }, + { + "epoch": 0.22641293133096413, + "grad_norm": 15.944112183565133, + "learning_rate": 9.022322762596746e-07, + "loss": 0.5029335021972656, + "step": 7900 + }, + { + "epoch": 0.22655623065459132, + "grad_norm": 12.621456367411607, + "learning_rate": 9.020943907137779e-07, + "loss": 0.4632993698120117, + "step": 7905 + }, + { + "epoch": 0.2266995299782185, + "grad_norm": 13.96934988163023, + "learning_rate": 9.019564185557503e-07, + "loss": 0.4971011161804199, + "step": 7910 + }, + { + "epoch": 0.22684282930184568, + "grad_norm": 15.550369238287765, + "learning_rate": 9.01818359815311e-07, + "loss": 0.48368287086486816, + "step": 7915 + }, + { + "epoch": 0.22698612862547288, + "grad_norm": 70.28721780737617, + "learning_rate": 9.016802145221989e-07, + "loss": 0.47428140640258787, + "step": 7920 + }, + { + "epoch": 0.22712942794910007, + "grad_norm": 15.788669148943411, + "learning_rate": 9.015419827061701e-07, + "loss": 0.5231688976287842, + "step": 7925 + }, + { + "epoch": 0.22727272727272727, + "grad_norm": 14.515766090638314, + "learning_rate": 9.014036643970003e-07, + "loss": 0.44630908966064453, + "step": 7930 + }, + { + "epoch": 0.22741602659635446, + "grad_norm": 18.3942398768572, + "learning_rate": 9.012652596244839e-07, + "loss": 0.491472053527832, + "step": 7935 + }, + { + "epoch": 0.22755932591998165, + "grad_norm": 17.297030209270044, + "learning_rate": 9.011267684184332e-07, + "loss": 0.46556901931762695, + "step": 7940 + }, + { + "epoch": 0.22770262524360885, + "grad_norm": 16.745865545677127, + "learning_rate": 9.009881908086798e-07, + "loss": 0.4692821502685547, + "step": 7945 + }, + { + "epoch": 0.22784592456723604, + "grad_norm": 50.66737299663521, + "learning_rate": 9.008495268250737e-07, + "loss": 0.4648386001586914, + "step": 7950 + }, + { + "epoch": 0.22798922389086324, + "grad_norm": 12.180393752279416, + "learning_rate": 9.007107764974832e-07, + "loss": 0.4748466968536377, + "step": 7955 + }, + { + "epoch": 0.22813252321449043, + "grad_norm": 25.206454369588712, + "learning_rate": 9.005719398557959e-07, + "loss": 0.4971724510192871, + "step": 7960 + }, + { + "epoch": 0.22827582253811762, + "grad_norm": 14.615444739658566, + "learning_rate": 9.004330169299172e-07, + "loss": 0.4825188636779785, + "step": 7965 + }, + { + "epoch": 0.22841912186174482, + "grad_norm": 13.625669786766968, + "learning_rate": 9.002940077497716e-07, + "loss": 0.46204404830932616, + "step": 7970 + }, + { + "epoch": 0.228562421185372, + "grad_norm": 17.10803148883589, + "learning_rate": 9.001549123453019e-07, + "loss": 0.4774447441101074, + "step": 7975 + }, + { + "epoch": 0.2287057205089992, + "grad_norm": 17.539333473761943, + "learning_rate": 9.000157307464695e-07, + "loss": 0.4760782241821289, + "step": 7980 + }, + { + "epoch": 0.2288490198326264, + "grad_norm": 18.097374798443266, + "learning_rate": 8.998764629832549e-07, + "loss": 0.49587416648864746, + "step": 7985 + }, + { + "epoch": 0.2289923191562536, + "grad_norm": 47.06718461052614, + "learning_rate": 8.997371090856563e-07, + "loss": 0.4522270202636719, + "step": 7990 + }, + { + "epoch": 0.2291356184798808, + "grad_norm": 36.15219002492128, + "learning_rate": 8.99597669083691e-07, + "loss": 0.4705718994140625, + "step": 7995 + }, + { + "epoch": 0.22927891780350798, + "grad_norm": 12.987662052136328, + "learning_rate": 8.994581430073948e-07, + "loss": 0.48763608932495117, + "step": 8000 + }, + { + "epoch": 0.22942221712713515, + "grad_norm": 15.693673656205307, + "learning_rate": 8.993185308868221e-07, + "loss": 0.4764582633972168, + "step": 8005 + }, + { + "epoch": 0.22956551645076234, + "grad_norm": 14.660575828313545, + "learning_rate": 8.991788327520453e-07, + "loss": 0.46617679595947265, + "step": 8010 + }, + { + "epoch": 0.22970881577438954, + "grad_norm": 21.187429939075123, + "learning_rate": 8.990390486331559e-07, + "loss": 0.45303869247436523, + "step": 8015 + }, + { + "epoch": 0.22985211509801673, + "grad_norm": 13.934982928745958, + "learning_rate": 8.98899178560264e-07, + "loss": 0.4778312683105469, + "step": 8020 + }, + { + "epoch": 0.22999541442164392, + "grad_norm": 29.665921120997748, + "learning_rate": 8.987592225634974e-07, + "loss": 0.47497758865356443, + "step": 8025 + }, + { + "epoch": 0.23013871374527112, + "grad_norm": 29.754297786008596, + "learning_rate": 8.986191806730036e-07, + "loss": 0.47322511672973633, + "step": 8030 + }, + { + "epoch": 0.2302820130688983, + "grad_norm": 14.954347788062814, + "learning_rate": 8.984790529189476e-07, + "loss": 0.48627634048461915, + "step": 8035 + }, + { + "epoch": 0.2304253123925255, + "grad_norm": 109.14222033616524, + "learning_rate": 8.983388393315135e-07, + "loss": 0.44346179962158205, + "step": 8040 + }, + { + "epoch": 0.2305686117161527, + "grad_norm": 25.80223095072129, + "learning_rate": 8.981985399409033e-07, + "loss": 0.5121284008026123, + "step": 8045 + }, + { + "epoch": 0.2307119110397799, + "grad_norm": 22.32739832213263, + "learning_rate": 8.980581547773381e-07, + "loss": 0.46355619430541994, + "step": 8050 + }, + { + "epoch": 0.2308552103634071, + "grad_norm": 28.0795803600872, + "learning_rate": 8.979176838710571e-07, + "loss": 0.42739181518554686, + "step": 8055 + }, + { + "epoch": 0.23099850968703428, + "grad_norm": 17.873436141276347, + "learning_rate": 8.977771272523182e-07, + "loss": 0.47932186126708987, + "step": 8060 + }, + { + "epoch": 0.23114180901066148, + "grad_norm": 11.598109066090313, + "learning_rate": 8.976364849513976e-07, + "loss": 0.45596818923950194, + "step": 8065 + }, + { + "epoch": 0.23128510833428867, + "grad_norm": 16.769315762714637, + "learning_rate": 8.9749575699859e-07, + "loss": 0.4895799160003662, + "step": 8070 + }, + { + "epoch": 0.23142840765791586, + "grad_norm": 15.657390056661146, + "learning_rate": 8.973549434242085e-07, + "loss": 0.4412865161895752, + "step": 8075 + }, + { + "epoch": 0.23157170698154306, + "grad_norm": 12.17511972381951, + "learning_rate": 8.972140442585847e-07, + "loss": 0.46314077377319335, + "step": 8080 + }, + { + "epoch": 0.23171500630517025, + "grad_norm": 21.766944276658112, + "learning_rate": 8.970730595320688e-07, + "loss": 0.4506492614746094, + "step": 8085 + }, + { + "epoch": 0.23185830562879745, + "grad_norm": 24.013349690156456, + "learning_rate": 8.969319892750289e-07, + "loss": 0.48956913948059083, + "step": 8090 + }, + { + "epoch": 0.2320016049524246, + "grad_norm": 17.435789664377396, + "learning_rate": 8.967908335178523e-07, + "loss": 0.4891559600830078, + "step": 8095 + }, + { + "epoch": 0.2321449042760518, + "grad_norm": 19.96899811167346, + "learning_rate": 8.966495922909441e-07, + "loss": 0.45986008644104004, + "step": 8100 + }, + { + "epoch": 0.2321449042760518, + "eval_bfov_iou": 0.7811897174902934, + "eval_bfov_iou@0.1": 0.94, + "eval_bfov_iou@0.25": 0.924, + "eval_bfov_iou@0.5": 0.916, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.6131428571428571, + "eval_exact_match": 0.2455, + "eval_invalid_choice_rate": 0.013142857142857144, + "eval_runtime": 582.7009, + "eval_samples_per_second": 3.432, + "eval_steps_per_second": 0.108, + "eval_task_acc_absolute_direction_mc": 0.86, + "eval_task_acc_camera_rotation_transform_mc": 0.668, + "eval_task_acc_object_conditioned_reorientation_mc": 0.48, + "eval_task_acc_observer_distance_choice": 0.564, + "eval_task_acc_relative_3d_position_mc": 0.52, + "eval_task_acc_relative_direction_mc": 0.564, + "eval_task_acc_seam_continuity_mc": 0.636, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.94, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.924, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.916, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7811897174902934, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 8100 + }, + { + "epoch": 0.232288203599679, + "grad_norm": 11.54013081918025, + "learning_rate": 8.965082656247278e-07, + "loss": 0.48349819183349607, + "step": 8105 + }, + { + "epoch": 0.2324315029233062, + "grad_norm": 17.909579401329232, + "learning_rate": 8.96366853549646e-07, + "loss": 0.4877286911010742, + "step": 8110 + }, + { + "epoch": 0.2325748022469334, + "grad_norm": 22.569871204287725, + "learning_rate": 8.962253560961587e-07, + "loss": 0.4988869667053223, + "step": 8115 + }, + { + "epoch": 0.23271810157056058, + "grad_norm": 19.72923089515704, + "learning_rate": 8.960837732947452e-07, + "loss": 0.46856842041015623, + "step": 8120 + }, + { + "epoch": 0.23286140089418778, + "grad_norm": 14.89570880920654, + "learning_rate": 8.959421051759026e-07, + "loss": 0.46255922317504883, + "step": 8125 + }, + { + "epoch": 0.23300470021781497, + "grad_norm": 27.175062529032008, + "learning_rate": 8.958003517701466e-07, + "loss": 0.461656379699707, + "step": 8130 + }, + { + "epoch": 0.23314799954144216, + "grad_norm": 21.393186946998423, + "learning_rate": 8.956585131080112e-07, + "loss": 0.4745144844055176, + "step": 8135 + }, + { + "epoch": 0.23329129886506936, + "grad_norm": 17.796693068980623, + "learning_rate": 8.955165892200489e-07, + "loss": 0.4491474151611328, + "step": 8140 + }, + { + "epoch": 0.23343459818869655, + "grad_norm": 12.03701570338103, + "learning_rate": 8.953745801368304e-07, + "loss": 0.4968195915222168, + "step": 8145 + }, + { + "epoch": 0.23357789751232375, + "grad_norm": 29.714896795402883, + "learning_rate": 8.952324858889447e-07, + "loss": 0.46849913597106935, + "step": 8150 + }, + { + "epoch": 0.23372119683595094, + "grad_norm": 18.179066519863106, + "learning_rate": 8.950903065069994e-07, + "loss": 0.5355954170227051, + "step": 8155 + }, + { + "epoch": 0.23386449615957813, + "grad_norm": 24.70456664604375, + "learning_rate": 8.949480420216203e-07, + "loss": 0.46390862464904786, + "step": 8160 + }, + { + "epoch": 0.23400779548320533, + "grad_norm": 19.67902066885664, + "learning_rate": 8.948056924634515e-07, + "loss": 0.449643611907959, + "step": 8165 + }, + { + "epoch": 0.23415109480683252, + "grad_norm": 25.95841536803472, + "learning_rate": 8.946632578631554e-07, + "loss": 0.4417112827301025, + "step": 8170 + }, + { + "epoch": 0.23429439413045972, + "grad_norm": 14.80445701844591, + "learning_rate": 8.945207382514127e-07, + "loss": 0.47973408699035647, + "step": 8175 + }, + { + "epoch": 0.2344376934540869, + "grad_norm": 20.41631447135843, + "learning_rate": 8.943781336589226e-07, + "loss": 0.45940656661987306, + "step": 8180 + }, + { + "epoch": 0.23458099277771408, + "grad_norm": 23.671575801102282, + "learning_rate": 8.942354441164026e-07, + "loss": 0.47678661346435547, + "step": 8185 + }, + { + "epoch": 0.23472429210134127, + "grad_norm": 17.85598722763053, + "learning_rate": 8.94092669654588e-07, + "loss": 0.43843903541564944, + "step": 8190 + }, + { + "epoch": 0.23486759142496846, + "grad_norm": 14.465324644579402, + "learning_rate": 8.939498103042331e-07, + "loss": 0.4862179756164551, + "step": 8195 + }, + { + "epoch": 0.23501089074859566, + "grad_norm": 12.9732190352165, + "learning_rate": 8.938068660961101e-07, + "loss": 0.4741826057434082, + "step": 8200 + }, + { + "epoch": 0.23515419007222285, + "grad_norm": 18.881537488979525, + "learning_rate": 8.936638370610095e-07, + "loss": 0.4815347671508789, + "step": 8205 + }, + { + "epoch": 0.23529748939585005, + "grad_norm": 17.489426599739538, + "learning_rate": 8.935207232297401e-07, + "loss": 0.43060908317565916, + "step": 8210 + }, + { + "epoch": 0.23544078871947724, + "grad_norm": 20.097370129876655, + "learning_rate": 8.93377524633129e-07, + "loss": 0.4443682670593262, + "step": 8215 + }, + { + "epoch": 0.23558408804310443, + "grad_norm": 12.840425370389312, + "learning_rate": 8.932342413020216e-07, + "loss": 0.46693859100341795, + "step": 8220 + }, + { + "epoch": 0.23572738736673163, + "grad_norm": 14.04772879116583, + "learning_rate": 8.930908732672812e-07, + "loss": 0.4784817695617676, + "step": 8225 + }, + { + "epoch": 0.23587068669035882, + "grad_norm": 21.445749130419035, + "learning_rate": 8.9294742055979e-07, + "loss": 0.4746267318725586, + "step": 8230 + }, + { + "epoch": 0.23601398601398602, + "grad_norm": 18.83448095924583, + "learning_rate": 8.928038832104478e-07, + "loss": 0.49289646148681643, + "step": 8235 + }, + { + "epoch": 0.2361572853376132, + "grad_norm": 16.800494895375163, + "learning_rate": 8.926602612501731e-07, + "loss": 0.4584263801574707, + "step": 8240 + }, + { + "epoch": 0.2363005846612404, + "grad_norm": 18.748589913165464, + "learning_rate": 8.925165547099023e-07, + "loss": 0.48039822578430175, + "step": 8245 + }, + { + "epoch": 0.2364438839848676, + "grad_norm": 25.608273906680587, + "learning_rate": 8.923727636205902e-07, + "loss": 0.48033742904663085, + "step": 8250 + }, + { + "epoch": 0.2365871833084948, + "grad_norm": 12.185458971235846, + "learning_rate": 8.922288880132098e-07, + "loss": 0.4634209632873535, + "step": 8255 + }, + { + "epoch": 0.23673048263212199, + "grad_norm": 20.08456013643825, + "learning_rate": 8.920849279187521e-07, + "loss": 0.46299166679382325, + "step": 8260 + }, + { + "epoch": 0.23687378195574918, + "grad_norm": 15.907776940211532, + "learning_rate": 8.919408833682266e-07, + "loss": 0.4725973129272461, + "step": 8265 + }, + { + "epoch": 0.23701708127937637, + "grad_norm": 11.25020654090466, + "learning_rate": 8.917967543926608e-07, + "loss": 0.47246594429016114, + "step": 8270 + }, + { + "epoch": 0.23716038060300354, + "grad_norm": 18.04138750094888, + "learning_rate": 8.916525410231004e-07, + "loss": 0.49103736877441406, + "step": 8275 + }, + { + "epoch": 0.23730367992663073, + "grad_norm": 17.878156164637062, + "learning_rate": 8.915082432906096e-07, + "loss": 0.4955018997192383, + "step": 8280 + }, + { + "epoch": 0.23744697925025793, + "grad_norm": 28.599481696710082, + "learning_rate": 8.913638612262701e-07, + "loss": 0.47287607192993164, + "step": 8285 + }, + { + "epoch": 0.23759027857388512, + "grad_norm": 20.134343986739584, + "learning_rate": 8.912193948611824e-07, + "loss": 0.483488655090332, + "step": 8290 + }, + { + "epoch": 0.23773357789751232, + "grad_norm": 14.766731201882958, + "learning_rate": 8.910748442264646e-07, + "loss": 0.4744230270385742, + "step": 8295 + }, + { + "epoch": 0.2378768772211395, + "grad_norm": 14.177121639055203, + "learning_rate": 8.909302093532538e-07, + "loss": 0.4881305694580078, + "step": 8300 + }, + { + "epoch": 0.2380201765447667, + "grad_norm": 19.82997882066246, + "learning_rate": 8.907854902727044e-07, + "loss": 0.4753118991851807, + "step": 8305 + }, + { + "epoch": 0.2381634758683939, + "grad_norm": 19.89396975719346, + "learning_rate": 8.90640687015989e-07, + "loss": 0.4875030040740967, + "step": 8310 + }, + { + "epoch": 0.2383067751920211, + "grad_norm": 18.25645973152032, + "learning_rate": 8.90495799614299e-07, + "loss": 0.4874722003936768, + "step": 8315 + }, + { + "epoch": 0.23845007451564829, + "grad_norm": 17.672870599834468, + "learning_rate": 8.903508280988435e-07, + "loss": 0.4832621097564697, + "step": 8320 + }, + { + "epoch": 0.23859337383927548, + "grad_norm": 9.064030801706474, + "learning_rate": 8.902057725008494e-07, + "loss": 0.5058441162109375, + "step": 8325 + }, + { + "epoch": 0.23873667316290267, + "grad_norm": 16.73625658266338, + "learning_rate": 8.900606328515623e-07, + "loss": 0.4824173927307129, + "step": 8330 + }, + { + "epoch": 0.23887997248652987, + "grad_norm": 14.101715665070728, + "learning_rate": 8.899154091822454e-07, + "loss": 0.48769345283508303, + "step": 8335 + }, + { + "epoch": 0.23902327181015706, + "grad_norm": 23.28186627210916, + "learning_rate": 8.897701015241805e-07, + "loss": 0.5023556232452393, + "step": 8340 + }, + { + "epoch": 0.23916657113378426, + "grad_norm": 22.29266491409156, + "learning_rate": 8.896247099086671e-07, + "loss": 0.4870613098144531, + "step": 8345 + }, + { + "epoch": 0.23930987045741145, + "grad_norm": 43.01326513924056, + "learning_rate": 8.894792343670229e-07, + "loss": 0.47840027809143065, + "step": 8350 + }, + { + "epoch": 0.23945316978103864, + "grad_norm": 23.15784616334062, + "learning_rate": 8.893336749305839e-07, + "loss": 0.4622639656066895, + "step": 8355 + }, + { + "epoch": 0.23959646910466584, + "grad_norm": 13.490789906201572, + "learning_rate": 8.891880316307038e-07, + "loss": 0.4724151611328125, + "step": 8360 + }, + { + "epoch": 0.23973976842829303, + "grad_norm": 21.42949237664404, + "learning_rate": 8.890423044987544e-07, + "loss": 0.48725380897521975, + "step": 8365 + }, + { + "epoch": 0.2398830677519202, + "grad_norm": 13.324600379949445, + "learning_rate": 8.888964935661259e-07, + "loss": 0.45373167991638186, + "step": 8370 + }, + { + "epoch": 0.2400263670755474, + "grad_norm": 23.22106677644094, + "learning_rate": 8.887505988642261e-07, + "loss": 0.47422990798950193, + "step": 8375 + }, + { + "epoch": 0.2401696663991746, + "grad_norm": 13.311034202942567, + "learning_rate": 8.886046204244813e-07, + "loss": 0.5120612144470215, + "step": 8380 + }, + { + "epoch": 0.24031296572280178, + "grad_norm": 15.530981546396163, + "learning_rate": 8.884585582783355e-07, + "loss": 0.45241923332214357, + "step": 8385 + }, + { + "epoch": 0.24045626504642897, + "grad_norm": 11.962447642135086, + "learning_rate": 8.88312412457251e-07, + "loss": 0.43743114471435546, + "step": 8390 + }, + { + "epoch": 0.24059956437005617, + "grad_norm": 13.623916111241263, + "learning_rate": 8.881661829927079e-07, + "loss": 0.4627070426940918, + "step": 8395 + }, + { + "epoch": 0.24074286369368336, + "grad_norm": 21.39729635209774, + "learning_rate": 8.880198699162043e-07, + "loss": 0.45392370223999023, + "step": 8400 + }, + { + "epoch": 0.24074286369368336, + "eval_bfov_iou": 0.7994859434858498, + "eval_bfov_iou@0.1": 0.952, + "eval_bfov_iou@0.25": 0.936, + "eval_bfov_iou@0.5": 0.924, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.6257142857142857, + "eval_exact_match": 0.3, + "eval_invalid_choice_rate": 0.005714285714285714, + "eval_runtime": 796.7404, + "eval_samples_per_second": 2.51, + "eval_steps_per_second": 0.079, + "eval_task_acc_absolute_direction_mc": 0.88, + "eval_task_acc_camera_rotation_transform_mc": 0.636, + "eval_task_acc_object_conditioned_reorientation_mc": 0.54, + "eval_task_acc_observer_distance_choice": 0.588, + "eval_task_acc_relative_3d_position_mc": 0.5, + "eval_task_acc_relative_direction_mc": 0.572, + "eval_task_acc_seam_continuity_mc": 0.664, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.952, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.936, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.924, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7994859434858498, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 8400 + }, + { + "epoch": 0.24088616301731056, + "grad_norm": 19.95549726577489, + "learning_rate": 8.878734732592565e-07, + "loss": 0.4472762107849121, + "step": 8405 + }, + { + "epoch": 0.24102946234093775, + "grad_norm": 17.531412387027725, + "learning_rate": 8.877269930533986e-07, + "loss": 0.4846649646759033, + "step": 8410 + }, + { + "epoch": 0.24117276166456494, + "grad_norm": 28.34186547512898, + "learning_rate": 8.875804293301829e-07, + "loss": 0.4299349308013916, + "step": 8415 + }, + { + "epoch": 0.24131606098819214, + "grad_norm": 15.257284816204319, + "learning_rate": 8.874337821211795e-07, + "loss": 0.4456326007843018, + "step": 8420 + }, + { + "epoch": 0.24145936031181933, + "grad_norm": 24.232964051311697, + "learning_rate": 8.872870514579766e-07, + "loss": 0.47241792678833006, + "step": 8425 + }, + { + "epoch": 0.24160265963544653, + "grad_norm": 21.05190972773464, + "learning_rate": 8.871402373721805e-07, + "loss": 0.4882339000701904, + "step": 8430 + }, + { + "epoch": 0.24174595895907372, + "grad_norm": 22.15819487995056, + "learning_rate": 8.869933398954152e-07, + "loss": 0.4914100646972656, + "step": 8435 + }, + { + "epoch": 0.24188925828270091, + "grad_norm": 16.914343813761487, + "learning_rate": 8.868463590593228e-07, + "loss": 0.5023339271545411, + "step": 8440 + }, + { + "epoch": 0.2420325576063281, + "grad_norm": 14.443711585467469, + "learning_rate": 8.866992948955632e-07, + "loss": 0.4727160453796387, + "step": 8445 + }, + { + "epoch": 0.2421758569299553, + "grad_norm": 28.473457797725718, + "learning_rate": 8.865521474358144e-07, + "loss": 0.4627984046936035, + "step": 8450 + }, + { + "epoch": 0.2423191562535825, + "grad_norm": 37.577062131382405, + "learning_rate": 8.864049167117726e-07, + "loss": 0.48152875900268555, + "step": 8455 + }, + { + "epoch": 0.24246245557720966, + "grad_norm": 29.214152191852037, + "learning_rate": 8.862576027551515e-07, + "loss": 0.4751421928405762, + "step": 8460 + }, + { + "epoch": 0.24260575490083686, + "grad_norm": 19.603299361130404, + "learning_rate": 8.861102055976828e-07, + "loss": 0.4393308162689209, + "step": 8465 + }, + { + "epoch": 0.24274905422446405, + "grad_norm": 14.385281191063637, + "learning_rate": 8.859627252711164e-07, + "loss": 0.44484567642211914, + "step": 8470 + }, + { + "epoch": 0.24289235354809124, + "grad_norm": 17.50009087901389, + "learning_rate": 8.858151618072199e-07, + "loss": 0.5198230266571044, + "step": 8475 + }, + { + "epoch": 0.24303565287171844, + "grad_norm": 90.23355218414213, + "learning_rate": 8.856675152377786e-07, + "loss": 0.48792028427124023, + "step": 8480 + }, + { + "epoch": 0.24317895219534563, + "grad_norm": 14.707469777788491, + "learning_rate": 8.855197855945962e-07, + "loss": 0.5015013217926025, + "step": 8485 + }, + { + "epoch": 0.24332225151897283, + "grad_norm": 12.814625114905692, + "learning_rate": 8.853719729094939e-07, + "loss": 0.4748403072357178, + "step": 8490 + }, + { + "epoch": 0.24346555084260002, + "grad_norm": 15.735849182344706, + "learning_rate": 8.852240772143109e-07, + "loss": 0.466131591796875, + "step": 8495 + }, + { + "epoch": 0.24360885016622721, + "grad_norm": 16.422398601815097, + "learning_rate": 8.850760985409045e-07, + "loss": 0.47098493576049805, + "step": 8500 + }, + { + "epoch": 0.2437521494898544, + "grad_norm": 13.669100469598678, + "learning_rate": 8.849280369211493e-07, + "loss": 0.49321613311767576, + "step": 8505 + }, + { + "epoch": 0.2438954488134816, + "grad_norm": 13.956196164087276, + "learning_rate": 8.847798923869386e-07, + "loss": 0.460036039352417, + "step": 8510 + }, + { + "epoch": 0.2440387481371088, + "grad_norm": 14.708806395272243, + "learning_rate": 8.846316649701828e-07, + "loss": 0.4613286018371582, + "step": 8515 + }, + { + "epoch": 0.244182047460736, + "grad_norm": 13.050486416233952, + "learning_rate": 8.844833547028106e-07, + "loss": 0.44948129653930663, + "step": 8520 + }, + { + "epoch": 0.24432534678436318, + "grad_norm": 18.731894024153117, + "learning_rate": 8.843349616167681e-07, + "loss": 0.4623112678527832, + "step": 8525 + }, + { + "epoch": 0.24446864610799038, + "grad_norm": 24.66361886116018, + "learning_rate": 8.8418648574402e-07, + "loss": 0.45687217712402345, + "step": 8530 + }, + { + "epoch": 0.24461194543161757, + "grad_norm": 27.428760788286713, + "learning_rate": 8.84037927116548e-07, + "loss": 0.49613280296325685, + "step": 8535 + }, + { + "epoch": 0.24475524475524477, + "grad_norm": 18.583835027846476, + "learning_rate": 8.838892857663522e-07, + "loss": 0.45428924560546874, + "step": 8540 + }, + { + "epoch": 0.24489854407887196, + "grad_norm": 11.713539890540533, + "learning_rate": 8.837405617254503e-07, + "loss": 0.47220478057861326, + "step": 8545 + }, + { + "epoch": 0.24504184340249913, + "grad_norm": 14.939191359198684, + "learning_rate": 8.835917550258777e-07, + "loss": 0.4493133544921875, + "step": 8550 + }, + { + "epoch": 0.24518514272612632, + "grad_norm": 14.695929007322317, + "learning_rate": 8.834428656996878e-07, + "loss": 0.4787053108215332, + "step": 8555 + }, + { + "epoch": 0.24532844204975351, + "grad_norm": 15.740183598818998, + "learning_rate": 8.832938937789518e-07, + "loss": 0.41716604232788085, + "step": 8560 + }, + { + "epoch": 0.2454717413733807, + "grad_norm": 18.122231810508755, + "learning_rate": 8.831448392957586e-07, + "loss": 0.48280086517333987, + "step": 8565 + }, + { + "epoch": 0.2456150406970079, + "grad_norm": 18.338946845106218, + "learning_rate": 8.829957022822148e-07, + "loss": 0.49134387969970705, + "step": 8570 + }, + { + "epoch": 0.2457583400206351, + "grad_norm": 24.991749962195673, + "learning_rate": 8.82846482770445e-07, + "loss": 0.4818402290344238, + "step": 8575 + }, + { + "epoch": 0.2459016393442623, + "grad_norm": 14.314171855055154, + "learning_rate": 8.826971807925914e-07, + "loss": 0.45925049781799315, + "step": 8580 + }, + { + "epoch": 0.24604493866788948, + "grad_norm": 24.042425596804748, + "learning_rate": 8.825477963808139e-07, + "loss": 0.497023868560791, + "step": 8585 + }, + { + "epoch": 0.24618823799151668, + "grad_norm": 18.160437355181887, + "learning_rate": 8.823983295672906e-07, + "loss": 0.45731124877929685, + "step": 8590 + }, + { + "epoch": 0.24633153731514387, + "grad_norm": 17.152899869111266, + "learning_rate": 8.822487803842167e-07, + "loss": 0.4682442665100098, + "step": 8595 + }, + { + "epoch": 0.24647483663877107, + "grad_norm": 12.794697400843587, + "learning_rate": 8.820991488638057e-07, + "loss": 0.4369030952453613, + "step": 8600 + }, + { + "epoch": 0.24661813596239826, + "grad_norm": 17.085402877872127, + "learning_rate": 8.819494350382884e-07, + "loss": 0.5028247356414794, + "step": 8605 + }, + { + "epoch": 0.24676143528602545, + "grad_norm": 11.941404058875886, + "learning_rate": 8.817996389399136e-07, + "loss": 0.4928277492523193, + "step": 8610 + }, + { + "epoch": 0.24690473460965265, + "grad_norm": 17.965149334438248, + "learning_rate": 8.816497606009478e-07, + "loss": 0.4769721984863281, + "step": 8615 + }, + { + "epoch": 0.24704803393327984, + "grad_norm": 20.35880327043565, + "learning_rate": 8.814998000536751e-07, + "loss": 0.47005863189697267, + "step": 8620 + }, + { + "epoch": 0.24719133325690704, + "grad_norm": 14.121652863948581, + "learning_rate": 8.813497573303974e-07, + "loss": 0.4934974670410156, + "step": 8625 + }, + { + "epoch": 0.24733463258053423, + "grad_norm": 12.501648733931471, + "learning_rate": 8.811996324634345e-07, + "loss": 0.467899227142334, + "step": 8630 + }, + { + "epoch": 0.24747793190416142, + "grad_norm": 12.845717864343209, + "learning_rate": 8.810494254851232e-07, + "loss": 0.4604206085205078, + "step": 8635 + }, + { + "epoch": 0.24762123122778862, + "grad_norm": 10.776563710378676, + "learning_rate": 8.808991364278189e-07, + "loss": 0.4132228374481201, + "step": 8640 + }, + { + "epoch": 0.24776453055141578, + "grad_norm": 32.5534068035484, + "learning_rate": 8.807487653238938e-07, + "loss": 0.4910059928894043, + "step": 8645 + }, + { + "epoch": 0.24790782987504298, + "grad_norm": 14.613317806047245, + "learning_rate": 8.805983122057388e-07, + "loss": 0.482450008392334, + "step": 8650 + }, + { + "epoch": 0.24805112919867017, + "grad_norm": 16.06654339675983, + "learning_rate": 8.804477771057612e-07, + "loss": 0.5050084114074707, + "step": 8655 + }, + { + "epoch": 0.24819442852229737, + "grad_norm": 13.346165983468826, + "learning_rate": 8.802971600563873e-07, + "loss": 0.44519824981689454, + "step": 8660 + }, + { + "epoch": 0.24833772784592456, + "grad_norm": 17.146592863303916, + "learning_rate": 8.801464610900597e-07, + "loss": 0.46198129653930664, + "step": 8665 + }, + { + "epoch": 0.24848102716955175, + "grad_norm": 13.035343742971964, + "learning_rate": 8.7999568023924e-07, + "loss": 0.46451506614685056, + "step": 8670 + }, + { + "epoch": 0.24862432649317895, + "grad_norm": 12.221471186666351, + "learning_rate": 8.798448175364064e-07, + "loss": 0.4737973213195801, + "step": 8675 + }, + { + "epoch": 0.24876762581680614, + "grad_norm": 18.932413737610492, + "learning_rate": 8.796938730140551e-07, + "loss": 0.483095645904541, + "step": 8680 + }, + { + "epoch": 0.24891092514043334, + "grad_norm": 24.133207878238323, + "learning_rate": 8.795428467047e-07, + "loss": 0.4507643222808838, + "step": 8685 + }, + { + "epoch": 0.24905422446406053, + "grad_norm": 13.9769043183638, + "learning_rate": 8.793917386408724e-07, + "loss": 0.4471887588500977, + "step": 8690 + }, + { + "epoch": 0.24919752378768772, + "grad_norm": 12.009229260463934, + "learning_rate": 8.792405488551216e-07, + "loss": 0.4888181686401367, + "step": 8695 + }, + { + "epoch": 0.24934082311131492, + "grad_norm": 32.858659536720324, + "learning_rate": 8.790892773800142e-07, + "loss": 0.41931972503662107, + "step": 8700 + }, + { + "epoch": 0.24934082311131492, + "eval_bfov_iou": 0.7857576270223217, + "eval_bfov_iou@0.1": 0.96, + "eval_bfov_iou@0.25": 0.956, + "eval_bfov_iou@0.5": 0.952, + "eval_bfov_valid_rate": 1.0, + "eval_choice_accuracy": 0.6588571428571428, + "eval_exact_match": 0.2205, + "eval_invalid_choice_rate": 0.027428571428571427, + "eval_runtime": 1341.3095, + "eval_samples_per_second": 1.491, + "eval_steps_per_second": 0.047, + "eval_task_acc_absolute_direction_mc": 0.872, + "eval_task_acc_camera_rotation_transform_mc": 0.772, + "eval_task_acc_object_conditioned_reorientation_mc": 0.588, + "eval_task_acc_observer_distance_choice": 0.58, + "eval_task_acc_relative_3d_position_mc": 0.568, + "eval_task_acc_relative_direction_mc": 0.552, + "eval_task_acc_seam_continuity_mc": 0.68, + "eval_task_bfov_count_referring_grounding_bfov": 250.0, + "eval_task_bfov_iou@0.1_referring_grounding_bfov": 0.96, + "eval_task_bfov_iou@0.25_referring_grounding_bfov": 0.956, + "eval_task_bfov_iou@0.5_referring_grounding_bfov": 0.952, + "eval_task_bfov_iou_referring_grounding_bfov": 0.7857576270223217, + "eval_task_bfov_valid_rate_referring_grounding_bfov": 1.0, + "eval_task_count_absolute_direction_mc": 250.0, + "eval_task_count_camera_rotation_transform_mc": 250.0, + "eval_task_count_object_conditioned_reorientation_mc": 250.0, + "eval_task_count_observer_distance_choice": 250.0, + "eval_task_count_relative_3d_position_mc": 250.0, + "eval_task_count_relative_direction_mc": 250.0, + "eval_task_count_seam_continuity_mc": 250.0, + "step": 8700 + } + ], + "logging_steps": 5, + "max_steps": 34892, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 300, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2.0008720071131136e+16, + "train_batch_size": 2, + "trial_name": null, + "trial_params": null +}